From cbf0e1dab0edc896f70b14163d5a5f7cbd7eaa40 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Wed, 22 Nov 2023 08:05:52 +0900 Subject: [PATCH 01/51] Enhance maximum value of DepthU to 1024 (#1821) - changed maximum value of DepthU to 1024 - used globalParameters MaxDepthU to define maximum value of DepthU - added test case for DepthU=1024 --- Tensile/Common.py | 4 +- .../local_split_u/f8gemm_lsu_mfma.yaml | 51 +++++++++++++++++++ 2 files changed, 53 insertions(+), 2 deletions(-) diff --git a/Tensile/Common.py b/Tensile/Common.py index f69098a3b..9baa3dccd 100644 --- a/Tensile/Common.py +++ b/Tensile/Common.py @@ -194,7 +194,7 @@ # shouldn't need to change globalParameters["DeviceLDS"] = 65536 # LDS bytes per CU, for computing occupancy globalParameters["MaxLDS"] = 65536 # max LDS a kernel should attempt to use -globalParameters["MaxDepthU"] = 256 # max DepthU value to allow +globalParameters["MaxDepthU"] = 1024 # max DepthU value to allow globalParameters["ShortNames"] = False # on windows kernel names can get too long; =True will convert solution/kernel names to serial ids globalParameters["MergeFiles"] = True # F=store every solution and kernel in separate file; T=store all solutions in single file globalParameters["NumMergedFiles"] = 1 # The number of files that kernels should be split between when merging @@ -339,7 +339,7 @@ def getArchitectureName(gfxName): validISA = [(0,0,0)] validISA.extend(globalParameters["SupportedISA"]) depthUs = list(range(-16, 0)) -depthUs.extend(list(range(2,512+1,1))) +depthUs.extend(list(range(2,globalParameters["MaxDepthU"]+1,1))) for i in validMacroTileSides: for j in validMacroTileSides: validMacroTiles.append([i, j]) diff --git a/Tensile/Tests/extended/local_split_u/f8gemm_lsu_mfma.yaml b/Tensile/Tests/extended/local_split_u/f8gemm_lsu_mfma.yaml index b276061e8..244126573 100644 --- a/Tensile/Tests/extended/local_split_u/f8gemm_lsu_mfma.yaml +++ 
b/Tensile/Tests/extended/local_split_u/f8gemm_lsu_mfma.yaml @@ -372,4 +372,55 @@ BenchmarkProblems: - ProblemSizes: - Exact: [ 252, 252, 1, 2052] + ######################################## + # B8B8S NN - LSU + large DepthU + ######################################## + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - MatrixInstruction: + - [16, 16, 32, 1, 1, 1, 1, 1,1] # 16x16 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + #- [ 64, 1, 1 ] # only WG2 is effective for 9 parameter MI + - [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + - [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI + - AssertFree0ElementMultiple : [4] + - AssertFree1ElementMultiple : [4] + - AssertSummationElementMultiple: [4] + - DepthU: [512,1024]#[8,16,32] + - GlobalSplitU: [1,4] + - GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - 1LDSBuffer: [0] + - LoopTail: [True] + - OptNoLoadLoop: [1] + - PrefetchGlobalRead: [2] + - PrefetchLocalRead: [1,9,17,33] + - ScheduleIterAlg: [3] + - StaggerU: [0] + - SourceSwap: [0,1] + #- TransposeLDS: [0,1] + - GlobalReadVectorWidth: [4]#[4,8] + - VectorWidth: [1]#[2,4] + - VectorAtomicWidth: [-1] + #- WaveSeparateGlobalReadB: [1] + #- MIArchVgpr: [True, False] + - NumElementsPerBatchStore: [0] + - UseSgprForGRO: [0] + #- BufferLoad: [0,1] + #- BufferStore: [0,1] + - TransposeLDS: [1] + - LocalReadVectorWidth: [-1] + #- VgprForLocalReadPacking: [0,1] + #- ClusterLocalRead: [0,1] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Exact: [ 252, 252, 1, 2052] + From 5b24ff13ef62bdf8e1756a619eb5019ce996fdaf Mon Sep 17 00:00:00 2001 From: Torre Zuk <42548444+TorreZuk@users.noreply.github.com> Date: Thu, 23 Nov 2023 11:16:50 -0700 Subject: [PATCH 02/51] tensile build with 16 threads (#1824) --- .jenkins/common.groovy | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git 
a/.jenkins/common.groovy b/.jenkins/common.groovy index 96561b377..8ca2bb7e6 100644 --- a/.jenkins/common.groovy +++ b/.jenkins/common.groovy @@ -35,6 +35,7 @@ def runCompileCommand(platform, project, jobName, boolean debug=false) // avoid bug causing long build times of certain files. String buildType = 'Release' // debug ? 'Debug' : 'RelWithDebInfo' String parallelJobs = "export HIPCC_COMPILE_FLAGS_APPEND='-O3 -Wno-format-nonliteral -parallel-jobs=4'" + String buildThreads = '16' // if hipcc is used may be multiplied by parallel-jobs // comment @@ -62,7 +63,7 @@ def runCompileCommand(platform, project, jobName, boolean debug=false) pushd build export PATH=/opt/rocm/bin:\$PATH - cmake -DCMAKE_BUILD_TYPE=${buildType} -DCMAKE_CXX_COMPILER=${compiler} -DTensile_ROOT=\$(pwd)/../Tensile ../HostLibraryTests + cmake -DCMAKE_BUILD_TYPE=${buildType} -DCMAKE_CXX_COMPILER=${compiler} -DTensile_CPU_THREADS=${buildThreads} -DTensile_ROOT=\$(pwd)/../Tensile ../HostLibraryTests NPROC_BUILD=16 if [ `nproc` -lt 16 ] then From a575e84eb7086596a58a6cdc14c6ead37cd7207f Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Fri, 24 Nov 2023 09:55:51 +0900 Subject: [PATCH 03/51] Optimized waitcnt lgkmcnt for 1LDSBuffer + PGR>1 (#1822) - removed redundant waitcnt lgkmcnt after 1LDSBuffer sync --- Tensile/KernelWriter.py | 15 +++++++++++---- 1 file changed, 11 insertions(+), 4 deletions(-) diff --git a/Tensile/KernelWriter.py b/Tensile/KernelWriter.py index 7cfea8efb..7074c71cd 100644 --- a/Tensile/KernelWriter.py +++ b/Tensile/KernelWriter.py @@ -1975,9 +1975,9 @@ def setupNewTile(self, kernel, tensorParametersA, tensorParametersB, isPap, isOp ############################################################################## - # get conditions to skip local write wait + # get conditions to skip local read write wait ############################################################################## - def getConditionToSkipLocalWriteWait( self, kernel , 
isPap, u, lastU): + def getConditionToSkipLocalReadWriteWait( self, kernel , isPap, u, lastU): # not generate wait code here if u == 0 u != lastU and DirectToVgpr + DirectToLds is enabled # (to remove redundant wait. isPap case only) # exception is PGR=2. wait is necessary for u = 0 in PGR=2 case @@ -1990,6 +1990,13 @@ def getConditionToSkipLocalWriteWait( self, kernel , isPap, u, lastU): condSkip = (u%self.numReadsIterCoalescedB != 0) and kernel["EnableMatrixInstruction"] and \ ((kernel["DirectToVgprA"] and (not kernel["ProblemType"]["TLUB"])) or \ (kernel["DirectToVgprB"] and (not kernel["ProblemType"]["TLUA"]))) + # another skip condition + # skip wait for SIA=3 and 1LDSBuffer and PLR > LoopIters and u > localWriteStartIter + # in this case, all local read is executed before 1LDSBuffer sync and no need to wait for local read + if (kernel["ScheduleIterAlg"] == 3 and kernel["1LDSBuffer"] and kernel["PrefetchLocalRead"] > kernel["LoopIters"]): + localWriteStartIter = self.lwStartMfmaIndex//self.numMfmaPerIter + if u > localWriteStartIter: + condSkip = True # no local write wait is necessary in DirectToVgprA + DirectToVgprB case cond2 = not (kernel["DirectToVgprA"] and kernel["DirectToVgprB"]) return cond1 and (not condSkip) and cond2 @@ -2170,7 +2177,7 @@ def noLoadLoopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack # we initiate lgkmcnt to 0, then assigning it correct value in makeSubIterSchedule() if self.enable["Wait"]: - if self.getConditionToSkipLocalWriteWait(kernel, isPap, u, kernel["LoopIters"] - 1): + if self.getConditionToSkipLocalReadWriteWait(kernel, isPap, u, kernel["LoopIters"] - 1): waitCode = self.wait(kernel, tensorParametersA, tensorParametersB, \ -1, 0, 0, \ "wait for prior local read local write") @@ -2743,7 +2750,7 @@ def loopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack, lc, # we initiate lgkmcnt to 0, then assigning it correct value in makeSubIterSchedule() if self.enable["Wait"]: - if 
self.getConditionToSkipLocalWriteWait(kernel, True, u, kernel["LoopIters"] - 1): + if self.getConditionToSkipLocalReadWriteWait(kernel, True, u, kernel["LoopIters"] - 1): waitCode = self.wait(kernel, tensorParametersA, tensorParametersB, \ -1, 0, 0, \ "wait for prior local read local write") From 48418208a6b1ea771a560d2e9b5b5823f02915e0 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Fri, 24 Nov 2023 09:57:03 +0900 Subject: [PATCH 04/51] reverse MFMA order in inner loop for odd outer iteration (#1823) --- Tensile/KernelWriterAssembly.py | 16 ++++++++++++++++ 1 file changed, 16 insertions(+) diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index 18fed4118..31b39d445 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -7175,6 +7175,18 @@ def mfmaIter(self, kernel, u, innerUnroll, vregSetIdx, lastKinloop=False, tail=F # release register if abReg is not None: self.vgprPool.checkIn(abReg) + # conditions to reverse idxInner if idxOuter is odd (for better HW efficiency) + # disable reverse idxInner if one of the following condition is true + # - PGR=2 and u == LoopIters - 1 and DTV + # - wmma + # - complex type + enableReverseInner = True + if (kernel["PrefetchGlobalRead"] == 2 and u == kernel["LoopIters"] - 1 and \ + (kernel["DirectToVgprA"] or kernel["DirectToVgprB"])) or \ + (not is_mfma) or \ + (kernel["ProblemType"]["DataType"].isComplex()): + enableReverseInner = False + prevAccIdx = -1 for iui in range(0, innerUnroll): zgemmVaddSrcCheck = [[], [], []] # to avoid generating redundant v_add @@ -7185,6 +7197,10 @@ def mfmaIter(self, kernel, u, innerUnroll, vregSetIdx, lastKinloop=False, tail=F inner = 1 - outer # inner is the opposite of outer for idxOuter in range(0, kernel["MIWaveTile"][outer]): for idxInner in range(0, kernel["MIWaveTile"][inner]): + # reverse idxInner if idxOuter is odd (for better HW efficiency) + reverseInner = idxOuter & 1 + if 
enableReverseInner and reverseInner: + idxInner = kernel["MIWaveTile"][inner] - 1 - idxInner idx0 = idxInner idx1 = idxOuter if self.swapMfmaInnerLoop: From 1a0b8d0ce284c8baf96ed537e12bc1fb10c7a6c9 Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Mon, 27 Nov 2023 08:48:11 -0700 Subject: [PATCH 05/51] Pre-apply offsets for strided batch kernels (#1826) --- .../hip/HipSolutionAdapter_test.cpp | 4 - .../ocl/OclSolutionAdapter_test.cpp | 2 - Tensile/Components/Signature.py | 9 +- ...128x16_MI16x16x4x1_GRVW2_SU4_SUS128_WGM4.s | 95 ++++++------------- Tensile/KernelWriterAssembly.py | 55 +++++++---- Tensile/KernelWriterBetaOnly.py | 15 +-- Tensile/KernelWriterConversion.py | 14 +-- Tensile/KernelWriterSource.py | 24 ++--- .../client/include/DataInitialization.hpp | 5 - .../client/source/DataInitialization.cpp | 4 - .../Source/lib/source/ContractionSolution.cpp | 65 +++++++++---- 11 files changed, 144 insertions(+), 148 deletions(-) diff --git a/HostLibraryTests/hip/HipSolutionAdapter_test.cpp b/HostLibraryTests/hip/HipSolutionAdapter_test.cpp index 2b118fc13..a7b08346e 100644 --- a/HostLibraryTests/hip/HipSolutionAdapter_test.cpp +++ b/HostLibraryTests/hip/HipSolutionAdapter_test.cpp @@ -74,8 +74,6 @@ TEST(HipSolutionAdapterTest, BetaOnlyKernel_Zero) k.args.append("D", d_d); k.args.append("C", c_d); - k.args.append("offsetD", desc.offset()); - k.args.append("offsetC", desc.offset()); k.args.append("strideD1", desc.strides()[1]); k.args.append("strideD2", desc.strides()[2]); k.args.append("strideC1", desc.strides()[1]); @@ -149,8 +147,6 @@ TEST(HipSolutionAdapterTest, BetaOnlyKernel_Nonzero) k.args.append("D", d_d); k.args.append("C", c_d); - k.args.append("offsetD", desc.offset()); - k.args.append("offsetC", desc.offset()); k.args.append("strideD1", desc.strides()[1]); k.args.append("strideD2", desc.strides()[2]); k.args.append("strideC1", desc.strides()[1]); diff --git a/HostLibraryTests/ocl/OclSolutionAdapter_test.cpp b/HostLibraryTests/ocl/OclSolutionAdapter_test.cpp 
index 6dbb55891..e18fd276a 100644 --- a/HostLibraryTests/ocl/OclSolutionAdapter_test.cpp +++ b/HostLibraryTests/ocl/OclSolutionAdapter_test.cpp @@ -82,8 +82,6 @@ KernelInvocation initKernelParams(Tensile::TensorDescriptor const& desc, // k.args.append("C", buffer_C); k.args.append("D", device_d); k.args.append("C", device_c); - k.args.append("offsetD", desc.offset()); - k.args.append("offsetC", desc.offset()); k.args.append("strideD1", desc.strides()[1]); k.args.append("strideD2", desc.strides()[2]); k.args.append("strideC1", desc.strides()[1]); diff --git a/Tensile/Components/Signature.py b/Tensile/Components/Signature.py index 531860a5a..557835e2d 100644 --- a/Tensile/Components/Signature.py +++ b/Tensile/Components/Signature.py @@ -211,10 +211,11 @@ def __call__(self, writer): kStr += self.addArgument( 'WS', '8', offset, "global_buffer", dstValueType, "generic"); offset += 8 kStr += self.addArgument( 'Flags', '8', offset, "global_buffer", dstValueType, "generic"); offset += 8 - kStr += self.addArgument("OffsetD", '8', offset, "by_value", "u64"); offset += 8 - kStr += self.addArgument("OffsetC", '8', offset, "by_value", "u64"); offset += 8 - kStr += self.addArgument("OffsetA", '8', offset, "by_value", "u64"); offset += 8 - kStr += self.addArgument("OffsetB", '8', offset, "by_value", "u64"); offset += 8 + if not kernel["ProblemType"]["StridedBatched"]: + kStr += self.addArgument("OffsetD", '8', offset, "by_value", "u64"); offset += 8 + kStr += self.addArgument("OffsetC", '8', offset, "by_value", "u64"); offset += 8 + kStr += self.addArgument("OffsetA", '8', offset, "by_value", "u64"); offset += 8 + kStr += self.addArgument("OffsetB", '8', offset, "by_value", "u64"); offset += 8 useSize = max(4, cptByte) kStr += self.addArgument( "alpha", useSize, offset, "by_value", cptValueType); offset += useSize diff --git a/Tensile/CustomKernels/DGEMM_Aldebaran_NN_MT128x128x16_MI16x16x4x1_GRVW2_SU4_SUS128_WGM4.s 
b/Tensile/CustomKernels/DGEMM_Aldebaran_NN_MT128x128x16_MI16x16x4x1_GRVW2_SU4_SUS128_WGM4.s index b2c37f346..6199997f3 100644 --- a/Tensile/CustomKernels/DGEMM_Aldebaran_NN_MT128x128x16_MI16x16x4x1_GRVW2_SU4_SUS128_WGM4.s +++ b/Tensile/CustomKernels/DGEMM_Aldebaran_NN_MT128x128x16_MI16x16x4x1_GRVW2_SU4_SUS128_WGM4.s @@ -137,134 +137,114 @@ amdhsa.kernels: .value_kind: global_buffer .value_type: f64 .address_space: generic - - .name: OffsetD - .size: 8 - .offset: 56 - .value_kind: by_value - .value_type: u64 - - .name: OffsetC - .size: 8 - .offset: 64 - .value_kind: by_value - .value_type: u64 - - .name: OffsetA - .size: 8 - .offset: 72 - .value_kind: by_value - .value_type: u64 - - .name: OffsetB - .size: 8 - .offset: 80 - .value_kind: by_value - .value_type: u64 - .name: alpha .size: 8 - .offset: 88 + .offset: 56 .value_kind: by_value .value_type: f64 - .name: beta .size: 8 - .offset: 96 + .offset: 64 .value_kind: by_value .value_type: f64 - .name: strideD0 .size: 4 - .offset: 104 + .offset: 72 .value_kind: by_value .value_type: u32 - .name: strideD1 .size: 4 - .offset: 108 + .offset: 76 .value_kind: by_value .value_type: u32 - .name: strideC0 .size: 4 - .offset: 112 + .offset: 80 .value_kind: by_value .value_type: u32 - .name: strideC1 .size: 4 - .offset: 116 + .offset: 84 .value_kind: by_value .value_type: u32 - .name: strideA0 .size: 4 - .offset: 120 + .offset: 88 .value_kind: by_value .value_type: u32 - .name: strideA1 .size: 4 - .offset: 124 + .offset: 92 .value_kind: by_value .value_type: u32 - .name: strideB0 .size: 4 - .offset: 128 + .offset: 96 .value_kind: by_value .value_type: u32 - .name: strideB1 .size: 4 - .offset: 132 + .offset: 100 .value_kind: by_value .value_type: u32 - .name: SizesFree0 .size: 4 - .offset: 136 + .offset: 104 .value_kind: by_value .value_type: u32 - .name: SizesFree1 .size: 4 - .offset: 140 + .offset: 108 .value_kind: by_value .value_type: u32 - .name: SizesFree2 .size: 4 - .offset: 144 + .offset: 112 .value_kind: by_value 
.value_type: u32 - .name: SizesSum0 .size: 4 - .offset: 148 + .offset: 116 .value_kind: by_value .value_type: u32 - .name: OrigStaggerUIter .size: 4 - .offset: 152 + .offset: 120 .value_kind: by_value .value_type: i32 - .name: NumWorkGroups0 .size: 4 - .offset: 156 + .offset: 124 .value_kind: by_value .value_type: u32 - .name: NumWorkGroups1 .size: 4 - .offset: 160 + .offset: 128 .value_kind: by_value .value_type: u32 - .name: NumFullBlocks .size: 4 - .offset: 164 + .offset: 132 .value_kind: by_value .value_type: u32 - .name: WgmRemainder1 .size: 4 - .offset: 168 + .offset: 136 .value_kind: by_value .value_type: u32 - .name: MagicNumberWgmRemainder1 .size: 4 - .offset: 172 + .offset: 140 .value_kind: by_value .value_type: u32 - .name: padding .size: 4 - .offset: 176 + .offset: 144 .value_kind: by_value .value_type: u32 .group_segment_fixed_size: 32768 .kernarg_segment_align: 8 - .kernarg_segment_size: 184 + .kernarg_segment_size: 152 .max_flat_workgroup_size: 256 .private_segment_fixed_size: 0 .sgpr_count: 73 @@ -597,10 +577,7 @@ DGEMM_Aldebaran_NN_MT128x128x16_MI16x16x4x1_GRVW2_SU4_SUS128_WGM4: .set sgprAddressC, 30 .set sgprAddressA, 32 .set sgprAddressB, 34 -.set sgprOffsetD, 36 -.set sgprOffsetC, 38 -.set sgprOffsetA, 40 -.set sgprOffsetB, 42 +/* offsets pre-applied */ .set sgprAlpha, 44 .set sgprBeta, 46 .set sgprStridesD, 48 @@ -740,27 +717,13 @@ v_mov_b32 v[vgprSerial], v0 // thread serial id /* Load Kernel Args */ s_load_dwordx16 s[24:39], s[sgprKernArgAddress:sgprKernArgAddress+1], 0x8 // -s_load_dwordx16 s[40:55], s[sgprKernArgAddress:sgprKernArgAddress+1], 0x48 // -s_load_dwordx8 s[56:63], s[sgprKernArgAddress:sgprKernArgAddress+1], 0x88 // -s_load_dwordx2 s[64:65], s[sgprKernArgAddress:sgprKernArgAddress+1], 0xA8 // +s_load_dwordx16 s[48:63], s[sgprKernArgAddress:sgprKernArgAddress+1], 0x48 // +s_load_dwordx2 s[64:65], s[sgprKernArgAddress:sgprKernArgAddress+1], 0x88 // s_waitcnt lgkmcnt(0) // wait for 160 bytes of kern args -s_lshl_b64 
s[sgprOffsetD:sgprOffsetD+1], s[sgprOffsetD:sgprOffsetD+1], 0x3 // elements offset to bytes offset -s_add_u32 s[sgprAddressD+0], s[sgprAddressD+0], s[sgprOffsetD] // add offset to buffer address -s_addc_u32 s[sgprAddressD+1], s[sgprAddressD+1], s[sgprOffsetD+1] // add offset to buffer address -s_lshl_b64 s[sgprOffsetC:sgprOffsetC+1], s[sgprOffsetC:sgprOffsetC+1], 0x3 // elements offset to bytes offset -s_add_u32 s[sgprAddressC+0], s[sgprAddressC+0], s[sgprOffsetC] // add offset to buffer address -s_addc_u32 s[sgprAddressC+1], s[sgprAddressC+1], s[sgprOffsetC+1] // add offset to buffer address -s_lshl_b64 s[sgprOffsetA:sgprOffsetA+1], s[sgprOffsetA:sgprOffsetA+1], 0x3 // elements offset to bytes offset -s_add_u32 s[sgprAddressA+0], s[sgprAddressA+0], s[sgprOffsetA] // add offset to buffer address -s_addc_u32 s[sgprAddressA+1], s[sgprAddressA+1], s[sgprOffsetA+1] // add offset to buffer address -s_lshl_b64 s[sgprOffsetB:sgprOffsetB+1], s[sgprOffsetB:sgprOffsetB+1], 0x3 // elements offset to bytes offset -s_add_u32 s[sgprAddressB+0], s[sgprAddressB+0], s[sgprOffsetB] // add offset to buffer address -s_addc_u32 s[sgprAddressB+1], s[sgprAddressB+1], s[sgprOffsetB+1] // add offset to buffer address - -.set OffsetD, UNDEF -.set OffsetC, UNDEF -.set OffsetA, UNDEF -.set OffsetB, UNDEF +s_mov_b32 s44, s36 +s_mov_b32 s45, s37 +s_mov_b32 s46, s38 +s_mov_b32 s47, s39 /* Short circuit condition if Alpha == 0, then sumDims=0 */ v_cmp_eq_f64 vcc, s[sgprAlpha:sgprAlpha+1], 0.0 // Alpha == 0.0 ? 
diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index 31b39d445..3601120ea 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -1715,10 +1715,10 @@ def initKernel(self, kernel, tPA, tPB ): self.numSgprStridesB -= 1 self.numSgprSizesSum = kernel["ProblemType"]["NumIndicesSummation"] self.numSgprSizesFree = kernel["ProblemType"]["NumIndicesC"] - self.numSgprOffsetD = 2 - self.numSgprOffsetC = 2 - self.numSgprOffsetA = 2 - self.numSgprOffsetB = 2 + self.numSgprOffsetD = 0 + self.numSgprOffsetC = 0 + self.numSgprOffsetA = 0 + self.numSgprOffsetB = 0 self.numSgprAddressDbg = self.rpga if globalParameters["DebugKernel"] else 0 #################################### @@ -1846,10 +1846,15 @@ def initKernel(self, kernel, tPA, tPB ): self.defineSgpr("AddressFlags", numSgprAddressFlags) self.argOffsetOffset += (numSgprAddressWS + numSgprAddressFlags) * 4 - self.defineSgpr("OffsetD", self.numSgprOffsetD) - self.defineSgpr("OffsetC", self.numSgprOffsetC) - self.defineSgpr("OffsetA", self.numSgprOffsetA) - self.defineSgpr("OffsetB", self.numSgprOffsetB) + if not kernel["ProblemType"]["StridedBatched"]: + self.numSgprOffsetD = 2 + self.numSgprOffsetC = 2 + self.numSgprOffsetA = 2 + self.numSgprOffsetB = 2 + self.defineSgpr("OffsetD", self.numSgprOffsetD) + self.defineSgpr("OffsetC", self.numSgprOffsetC) + self.defineSgpr("OffsetA", self.numSgprOffsetA) + self.defineSgpr("OffsetB", self.numSgprOffsetB) self.defineSgpr("Alpha", numSgprAlpha, numSgprAlpha) if kernel["ProblemType"]["UseBeta"]: @@ -3374,7 +3379,7 @@ def allocateResources(self, kernel, lraCode=None): self.sgprAddressStrCD = "Srd" # add offset to buffer - if not kernel["_GlobalAccumulation"] or kernel["_GlobalAccumulation"] == 'PartialsBuffer': + if not kernel["ProblemType"]["StridedBatched"] and (not kernel["_GlobalAccumulation"] or kernel["_GlobalAccumulation"] == 'PartialsBuffer'): kStr += inst("s_lshl_b64", sgpr("OffsetD", 2), sgpr("OffsetD", 2), 
hex(log2(self.bpeCexternal)), "elements offset to bytes offset") kStr += inst("s_add_u32", sgpr("%sD+0"%self.sgprAddressStrCD), sgpr("AddressD+0"), sgpr("OffsetD"), "add offset to buffer address") kStr += inst("s_addc_u32", sgpr("%sD+1"%self.sgprAddressStrCD), sgpr("AddressD+1"), sgpr("OffsetD+1"), "add offset to buffer address") @@ -3393,13 +3398,20 @@ def allocateResources(self, kernel, lraCode=None): dstAddressA1Str = sgpr("%sA+1"%self.sgprAddressStrAB) dstAddressB0Str = sgpr("%sB+0"%self.sgprAddressStrAB) dstAddressB1Str = sgpr("%sB+1"%self.sgprAddressStrAB) - kStr += inst("s_lshl_b64", sgpr("OffsetA", 2), sgpr("OffsetA", 2), hex(log2(self.bpeAB)), "elements offset to bytes offset") - kStr += inst("s_add_u32", dstAddressA0Str, sgpr("AddressA+0"), sgpr("OffsetA"), "add offset to buffer address") - kStr += inst("s_addc_u32", dstAddressA1Str, sgpr("AddressA+1"), sgpr("OffsetA+1"), "add offset to buffer address") - - kStr += inst("s_lshl_b64", sgpr("OffsetB", 2), sgpr("OffsetB", 2), hex(log2(self.bpeAB)), "elements offset to bytes offset") - kStr += inst("s_add_u32", dstAddressB0Str, sgpr("AddressB+0"), sgpr("OffsetB"), "add offset to buffer address") - kStr += inst("s_addc_u32", dstAddressB1Str, sgpr("AddressB+1"), sgpr("OffsetB+1"), "add offset to buffer address") + if not kernel["ProblemType"]["StridedBatched"]: + kStr += inst("s_lshl_b64", sgpr("OffsetA", 2), sgpr("OffsetA", 2), hex(log2(self.bpeAB)), "elements offset to bytes offset") + kStr += inst("s_add_u32", dstAddressA0Str, sgpr("AddressA+0"), sgpr("OffsetA"), "add offset to buffer address") + kStr += inst("s_addc_u32", dstAddressA1Str, sgpr("AddressA+1"), sgpr("OffsetA+1"), "add offset to buffer address") + + kStr += inst("s_lshl_b64", sgpr("OffsetB", 2), sgpr("OffsetB", 2), hex(log2(self.bpeAB)), "elements offset to bytes offset") + kStr += inst("s_add_u32", dstAddressB0Str, sgpr("AddressB+0"), sgpr("OffsetB"), "add offset to buffer address") + kStr += inst("s_addc_u32", dstAddressB1Str, 
sgpr("AddressB+1"), sgpr("OffsetB+1"), "add offset to buffer address") + elif self.releaseSgprAdressAB: + # copy AddressA,B to srdA,B to undefine AddressA,B + kStr += inst("s_mov_b32", sgpr("%sA+0"%self.sgprAddressStrAB), sgpr("AddressA+0"), "copy addressA") + kStr += inst("s_mov_b32", sgpr("%sA+1"%self.sgprAddressStrAB), sgpr("AddressA+1"), "copy addressA") + kStr += inst("s_mov_b32", sgpr("%sB+0"%self.sgprAddressStrAB), sgpr("AddressB+0"), "copy addressB") + kStr += inst("s_mov_b32", sgpr("%sB+1"%self.sgprAddressStrAB), sgpr("AddressB+1"), "copy addressB") # self.groOffsetInMacroTile == 1 case, subtract pre-pad here if self.groOffsetInMacroTile: @@ -3412,12 +3424,13 @@ def allocateResources(self, kernel, lraCode=None): kStr += inst("s_sub_u32", dstAddressB0Str, dstAddressB0Str, prePad, "pre-pad to make room for possible pointer shift") kStr += inst("s_subb_u32", dstAddressB1Str, dstAddressB1Str, 0, "pre-pad to make room for possible pointer shift") - # undefine Offset sgpr + # undefine Offset sgpr (only for general batch) kStr += self.endLine - kStr += self.undefineSgpr("OffsetD") - kStr += self.undefineSgpr("OffsetC") - kStr += self.undefineSgpr("OffsetA") - kStr += self.undefineSgpr("OffsetB") + if not kernel["ProblemType"]["StridedBatched"]: + kStr += self.undefineSgpr("OffsetD") + kStr += self.undefineSgpr("OffsetC") + kStr += self.undefineSgpr("OffsetA") + kStr += self.undefineSgpr("OffsetB") # undefine Address sgpr if self.releaseSgprAdressCD: kStr += self.undefineSgpr("AddressD") diff --git a/Tensile/KernelWriterBetaOnly.py b/Tensile/KernelWriterBetaOnly.py index 28bc91391..3ce38038a 100644 --- a/Tensile/KernelWriterBetaOnly.py +++ b/Tensile/KernelWriterBetaOnly.py @@ -76,8 +76,9 @@ def functionSignature(self): kStr += " " + ptrStr + " const * " + batch + "C," + self.endLine # offset - kStr += " uint64_t offsetD,%s" % self.endLine - kStr += " uint64_t offsetC,%s" % self.endLine + if not isStridedBuffer: + kStr += " uint64_t offsetD,%s" % self.endLine + 
kStr += " uint64_t offsetC,%s" % self.endLine # strides firstStrideCD = 1 @@ -191,11 +192,11 @@ def kernelBodyBetaOnly(self): zeroStr = self.state["ProblemType"]["ComputeDataType"].zeroString(self.language, 1) kStr += " " + ptrStr + f" const* C = (beta == {zeroStr}) ? nullptr : BatchC[wg];" + self.endLine - # apply offset - kStr += self.endLine - if not self.state["_GlobalAccumulation"]: - kStr += " D = D + offsetD;" + self.endLine - kStr += " C = C + offsetC;" + self.endLine + # apply offset only for general batch + kStr += self.endLine + if not self.state["_GlobalAccumulation"]: + kStr += " D = D + offsetD;" + self.endLine + kStr += " C = C + offsetC;" + self.endLine kStr += self.endLine diff --git a/Tensile/KernelWriterConversion.py b/Tensile/KernelWriterConversion.py index a612562da..34919ca9e 100644 --- a/Tensile/KernelWriterConversion.py +++ b/Tensile/KernelWriterConversion.py @@ -77,8 +77,9 @@ def functionSignature(self): kStr += " " + ptrStr + " const * " + bStr + "C," + self.endLine # offset - kStr += " uint64_t offsetD,%s" % self.endLine - kStr += " uint64_t offsetC,%s" % self.endLine + if not self.state["ProblemType"]["StridedBatched"]: + kStr += " uint64_t offsetD,%s" % self.endLine + kStr += " uint64_t offsetC,%s" % self.endLine # alpha & beta kStr += " %s const alpha,%s" % (self.state["ProblemType"]["ComputeDataType"].toDevice(self.language), self.endLine) @@ -231,11 +232,10 @@ def kernelBody(self): zeroStr = self.state["ProblemType"]["ComputeDataType"].zeroString(self.language, 1) kStr += " " + ptrStr + f" const* C = (beta == {zeroStr}) ? 
nullptr : BatchC[wg];" + self.endLine - ######################################## - # apply offset - kStr += self.endLine - kStr += " D = D + offsetD;" + self.endLine - kStr += " C = C + offsetC;" + self.endLine + # apply offset only for general batch + kStr += self.endLine + kStr += " D = D + offsetD;" + self.endLine + kStr += " C = C + offsetC;" + self.endLine ######################################## # D index diff --git a/Tensile/KernelWriterSource.py b/Tensile/KernelWriterSource.py index 965df5755..df13aee45 100644 --- a/Tensile/KernelWriterSource.py +++ b/Tensile/KernelWriterSource.py @@ -862,10 +862,11 @@ def functionSignature(self, kernel ): s += " " + globalStr + ptrStr + " const * " + batchStr + "B" # offset - s += "," + self.endLine + " uint64_t offsetD" - s += "," + self.endLine + " uint64_t offsetC" - s += "," + self.endLine + " uint64_t offsetA" - s += "," + self.endLine + " uint64_t offsetB" + if not kernel["ProblemType"]["StridedBatched"]: + s += "," + self.endLine + " uint64_t offsetD" + s += "," + self.endLine + " uint64_t offsetC" + s += "," + self.endLine + " uint64_t offsetA" + s += "," + self.endLine + " uint64_t offsetB" # alpha & beta s += "," + self.endLine + " " \ @@ -1070,14 +1071,13 @@ def allocateResources(self, kernel, lraCode=None): kStr += f" DATA_TYPE const* A = ((alpha == {zeroStr}) || (sizeUnroll == 0)) ? nullptr : BatchA[wg];" + self.endLine kStr += f" DATA_TYPE const* B = ((alpha == {zeroStr}) || (sizeUnroll == 0)) ? 
nullptr : BatchB[wg];" + self.endLine - #################################### - # apply offset - kStr += self.endLine - if not kernel["_GlobalAccumulation"]: - kStr += " D = D + offsetD;" + self.endLine - kStr += " C = C + offsetC;" + self.endLine - kStr += " A = A + offsetA;" + self.endLine - kStr += " B = B + offsetB;" + self.endLine + # apply offset only for general batch + kStr += self.endLine + if not kernel["_GlobalAccumulation"]: + kStr += " D = D + offsetD;" + self.endLine + kStr += " C = C + offsetC;" + self.endLine + kStr += " A = A + offsetA;" + self.endLine + kStr += " B = B + offsetB;" + self.endLine if 0: # in some cases we know the pad values at compile time and could hard-code here. Not enabled. diff --git a/Tensile/Source/client/include/DataInitialization.hpp b/Tensile/Source/client/include/DataInitialization.hpp index 7e901bc00..32bb98263 100644 --- a/Tensile/Source/client/include/DataInitialization.hpp +++ b/Tensile/Source/client/include/DataInitialization.hpp @@ -468,11 +468,6 @@ namespace Tensile InitMode m_aInit, m_bInit, m_cInit, m_dInit; InitMode m_alphaInit, m_betaInit; - size_t m_aBufferOffset; - size_t m_bBufferOffset; - size_t m_cBufferOffset; - size_t m_dBufferOffset; - size_t m_aMaxElements; size_t m_bMaxElements; size_t m_cMaxElements; diff --git a/Tensile/Source/client/source/DataInitialization.cpp b/Tensile/Source/client/source/DataInitialization.cpp index 34f739fbb..7928a85c7 100644 --- a/Tensile/Source/client/source/DataInitialization.cpp +++ b/Tensile/Source/client/source/DataInitialization.cpp @@ -392,10 +392,6 @@ namespace Tensile , m_dInit(args["init-d"].as()) , m_alphaInit(args["init-alpha"].as()) , m_betaInit(args["init-beta"].as()) - , m_aBufferOffset(args["offset-a"].as()) - , m_bBufferOffset(args["offset-b"].as()) - , m_cBufferOffset(args["offset-c"].as()) - , m_dBufferOffset(args["offset-d"].as()) , m_aMaxElements(0) , m_bMaxElements(0) , m_cMaxElements(0) diff --git a/Tensile/Source/lib/source/ContractionSolution.cpp 
b/Tensile/Source/lib/source/ContractionSolution.cpp index e9fb8590a..2ed74c37c 100644 --- a/Tensile/Source/lib/source/ContractionSolution.cpp +++ b/Tensile/Source/lib/source/ContractionSolution.cpp @@ -394,8 +394,12 @@ namespace Tensile } else if(problemType.stridedBatched) { - rv.args.append("d", inputs.d); - rv.args.append("c", inputs.c); + auto dptr = inputs.d; + dptr += d.offset(); + auto cptr = inputs.c; + cptr += c.offset(); + rv.args.append("d", dptr); + rv.args.append("c", cptr); } else { @@ -405,8 +409,12 @@ namespace Tensile if(problemType.stridedBatched) { - rv.args.append("a", inputs.a); - rv.args.append("b", inputs.b); + auto aptr = inputs.a; + aptr += a.offset(); + auto bptr = inputs.b; + bptr += b.offset(); + rv.args.append("a", aptr); + rv.args.append("b", bptr); } else { @@ -424,10 +432,13 @@ namespace Tensile rv.args.append("Flags", flags); } - rv.args.append("offsetD", d.offset()); - rv.args.append("offsetC", c.offset()); - rv.args.append("offsetA", a.offset()); - rv.args.append("offsetB", b.offset()); + if(!problemType.stridedBatched) + { + rv.args.append("offsetD", d.offset()); + rv.args.append("offsetC", c.offset()); + rv.args.append("offsetA", a.offset()); + rv.args.append("offsetB", b.offset()); + } rv.args.append("alpha", inputs.alpha); if(std::is_same::value && !isSourceKernel()) @@ -788,17 +799,28 @@ namespace Tensile if(sizeMapping.globalAccumulation) rv.args.append("WS", inputs.ws); else if(problemType.stridedBatched) - rv.args.append("D", inputs.d); + { + auto dptr = inputs.d; + dptr += d.offset(); + rv.args.append("D", dptr); + } else rv.args.append("batchD", inputs.batchD); if(problemType.stridedBatched) - rv.args.append("C", inputs.c); + { + auto cptr = inputs.c; + cptr += c.offset(); + rv.args.append("C", cptr); + } else rv.args.append("batchC", inputs.batchC); - rv.args.append("offsetD", d.offset()); - rv.args.append("offsetC", c.offset()); + if(!problemType.stridedBatched) + { + rv.args.append("offsetD", d.offset()); + 
rv.args.append("offsetC", c.offset()); + } if(sizeMapping.globalAccumulation) { @@ -954,19 +976,30 @@ namespace Tensile rv.numWorkItems.z = rv.workGroupSize.z * rv.numWorkGroups.z; if(problemType.stridedBatched) - rv.args.append("D", inputs.d); + { + auto dptr = inputs.d; + dptr += d.offset(); + rv.args.append("D", dptr); + } else rv.args.append("batchD", inputs.batchD); rv.args.append("WS", inputs.ws); if(problemType.stridedBatched) - rv.args.append("C", inputs.c); + { + auto cptr = inputs.c; + cptr += c.offset(); + rv.args.append("C", cptr); + } else rv.args.append("batchC", inputs.batchC); - rv.args.append("offsetD", d.offset()); - rv.args.append("offsetC", c.offset()); + if(!problemType.stridedBatched) + { + rv.args.append("offsetD", d.offset()); + rv.args.append("offsetC", c.offset()); + } if(sizeMapping.globalAccumulation == 2) rv.args.append("alpha", inputs.alpha); From 9e8f1ab9b708c52271dd53d5e20d45c59d3b5993 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Tue, 28 Nov 2023 05:43:56 +0900 Subject: [PATCH 06/51] Optimization for ShadowLimit (#1829) - removed ShadowLimit code with the following conditions noTailLoop + BufferLoad + no FractionalLoad + no transpose (TLU case) + MT and Depth are power of 2 (plus more conditions) --- Tensile/KernelWriter.py | 23 +++++ Tensile/KernelWriterAssembly.py | 147 ++++++++++++++++++-------------- 2 files changed, 104 insertions(+), 66 deletions(-) diff --git a/Tensile/KernelWriter.py b/Tensile/KernelWriter.py index 7074c71cd..4bdc974e1 100644 --- a/Tensile/KernelWriter.py +++ b/Tensile/KernelWriter.py @@ -3748,6 +3748,29 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): self.tailLoopInNLL = noTailLoop >= 2 self.noEarlyExitForTailLoopInNLL = noTailLoop == 3 + # no ShadowLimit code in loop optimization + # we do not need ShadowLimit check in loop under certain conditions + # noTailLoop=1 (TODO: support TailLoop) + # BufferLoad + # FractionalLoad==0 + # no 
packBatchDims + # EdgeType == Shift + # CheckDimOverflow < 2 + # MT0, MT1, DepthU are power of 2 + # TLU case only + def isPowerOf2(val): + return val > 0 and (val & (val - 1)) == 0 + self.noShadowLimitCodeInLoopA = False + self.noShadowLimitCodeInLoopB = False + if noTailLoop == 1 and kernel["BufferLoad"] and kernel["FractionalLoad"] == 0 and \ + kernel["PackBatchDims"] == 0 and kernel["EdgeType"] == "ShiftPtr" and \ + kernel["CheckDimOverflow"] <= 1 and \ + isPowerOf2(kernel["MacroTileA"]) and isPowerOf2(kernel["MacroTileB"]) and isPowerOf2(kernel["DepthU"]): + if tluA: + self.noShadowLimitCodeInLoopA = True + if tluB: + self.noShadowLimitCodeInLoopB = True + self.actualSummationLoops = 1 if kernel["PackSummationDims"] else kernel["ProblemType"]["NumIndicesSummation"] self.otherSummationLoops = self.actualSummationLoops-1 self.otherSummations = kernel["ProblemType"]["NumIndicesSummation"]-1 # not loops but summations vars diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index 3601120ea..0dcd67d3d 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -596,8 +596,10 @@ def defineVariableSgprs(self, kernel): self.defineSgpr("PerpOverhangVccB", 2, 2) if self.use64bShadowLimit: # If need more SGPR could overlap this with the Tensor2dSize regs - self.defineSgpr("ShadowLimitA", 2, 2) - self.defineSgpr("ShadowLimitB", 2, 2) + if self.noShadowLimitCodeInLoopA == False: + self.defineSgpr("ShadowLimitA", 2, 2) + if self.noShadowLimitCodeInLoopB == False: + self.defineSgpr("ShadowLimitB", 2, 2) if kernel["PackSummationDims"]: for tc in ('A','B'): @@ -4929,38 +4931,44 @@ def computeLoadSrd(self, kernel, tP, tc, indices, bpe, isPap): kStr += inst("s_mov_b32", sgpr(tileStart+0), 0, "set default tileStart") kStr += inst("s_mov_b32", sgpr(tileStart+1), 0, "set default tileStart") - if self.use64bShadowLimit: - limitTmp0 = "ShadowLimit%s+0"%tc - limitTmp1 = "ShadowLimit%s+1"%tc - else: - limitTmp0 = stmp+0 - limitTmp1 = 
stmp+1 - - kStr += inst("s_sub_u32", sgpr(limitTmp0), sgpr("Tensor2dSize%s"%tc), sgpr(tileStart+0), "sub tileStart") - kStr += inst("s_subb_u32", sgpr(limitTmp1), sgpr("Tensor2dSize%s+1"%tc), sgpr(tileStart+1), "sub tileStart") - - if self.use64bShadowLimit: - # Set initial buffer limit - # if the limit is >64bit, incrementSrd decrements the shadow as the SRD increments, - # and when we get within 32-bit we start to step down the SRD - # if the limit is <32bits, set it accurately here: - # Note lshl_b64 the higher-numbered SGPR has the upper 32-bits - kStr += inst("s_lshl_b64", sgpr("ShadowLimit%s"%tc,2), sgpr("ShadowLimit%s"%tc,2), \ - hex(log2(tP["bpe"])), "Set limit to use bytes") - if prePad: - kStr += inst("s_add_u32", sgpr("ShadowLimit%s+0"%tc), sgpr("ShadowLimit%s+0"%tc), prePad, "extend limit for pre-pad") - kStr += inst("s_addc_u32", sgpr("ShadowLimit%s+1"%tc), sgpr("ShadowLimit%s+1"%tc), 0, "extend limit for pre-pad") + noShadowLimitCodeInLoop = self.noShadowLimitCodeInLoopA if tc == "A" else self.noShadowLimitCodeInLoopB + if noShadowLimitCodeInLoop == False: + if self.use64bShadowLimit: + limitTmp0 = "ShadowLimit%s+0"%tc + limitTmp1 = "ShadowLimit%s+1"%tc + else: + limitTmp0 = stmp+0 + limitTmp1 = stmp+1 - if kernel["DirectToLds%s"%tc] and kernel["UseInstOffsetForGRO"]: - kStr += inst("s_add_u32", sgpr("ShadowLimit%s+0"%tc), sgpr("ShadowLimit%s+0"%tc), self.buff_load_inst_offset_max, "extend limit for directToLDS instruction offset") - kStr += inst("s_addc_u32", sgpr("ShadowLimit%s+1"%tc), sgpr("ShadowLimit%s+1"%tc), 0, "extend limit for directToLDS instruction offset") + kStr += inst("s_sub_u32", sgpr(limitTmp0), sgpr("Tensor2dSize%s"%tc), sgpr(tileStart+0), "sub tileStart") + kStr += inst("s_subb_u32", sgpr(limitTmp1), sgpr("Tensor2dSize%s+1"%tc), sgpr(tileStart+1), "sub tileStart") - kStr += inst("s_cmp_eq_u32", sgpr("ShadowLimit%s+1"%tc), 0, "are we within 2^32?") - kStr += inst("s_cselect_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), 
"BufferLimit%s"%tc, "Move shadow to real if we are within 2^32") + if self.use64bShadowLimit: + # Set initial buffer limit + # if the limit is >64bit, incrementSrd decrements the shadow as the SRD increments, + # and when we get within 32-bit we start to step down the SRD + # if the limit is <32bits, set it accurately here: + # Note lshl_b64 the higher-numbered SGPR has the upper 32-bits + kStr += inst("s_lshl_b64", sgpr("ShadowLimit%s"%tc,2), sgpr("ShadowLimit%s"%tc,2), \ + hex(log2(tP["bpe"])), "Set limit to use bytes") + if prePad: + kStr += inst("s_add_u32", sgpr("ShadowLimit%s+0"%tc), sgpr("ShadowLimit%s+0"%tc), prePad, "extend limit for pre-pad") + kStr += inst("s_addc_u32", sgpr("ShadowLimit%s+1"%tc), sgpr("ShadowLimit%s+1"%tc), 0, "extend limit for pre-pad") + + if kernel["DirectToLds%s"%tc] and kernel["UseInstOffsetForGRO"]: + kStr += inst("s_add_u32", sgpr("ShadowLimit%s+0"%tc), sgpr("ShadowLimit%s+0"%tc), self.buff_load_inst_offset_max, "extend limit for directToLDS instruction offset") + kStr += inst("s_addc_u32", sgpr("ShadowLimit%s+1"%tc), sgpr("ShadowLimit%s+1"%tc), 0, "extend limit for directToLDS instruction offset") + + kStr += inst("s_cmp_eq_u32", sgpr("ShadowLimit%s+1"%tc), 0, "are we within 2^32?") + kStr += inst("s_cselect_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), "BufferLimit%s"%tc, "Move shadow to real if we are within 2^32") + else: + # put limit directly into SRD: + kStr += inst("s_lshl_b32", sgpr("Srd%s+2"%tc), sgpr(stmp+0), hex(log2(tP["bpe"])), "Set limit to use bytes") + kStr += inst("s_add_u32", sgpr("Srd%s+2"%tc), sgpr("Srd%s+2"%tc), prePad, "extend limit for pre-pad") else: - # put limit directly into SRD: - kStr += inst("s_lshl_b32", sgpr("Srd%s+2"%tc), sgpr(stmp+0), hex(log2(tP["bpe"])), "Set limit to use bytes") - kStr += inst("s_add_u32", sgpr("Srd%s+2"%tc), sgpr("Srd%s+2"%tc), prePad, "extend limit for pre-pad") + # noShadowLimitCodeInLoop case + # no out of range check + kStr += inst("s_mov_b32", 
sgpr("Srd%s+2"%tc), "BufferLimit%s"%tc, "Set BufferLimit in no ShadowLimit code case") # Apply any high-order address components to the tileStart and eventually the SRD - batch idx for batched gemm if kernel["ProblemType"]["StridedBatched"]: @@ -5051,7 +5059,8 @@ def computeLoadSrd(self, kernel, tP, tc, indices, bpe, isPap): # invalid global read for performance evaluation only if self.enable["InvalidGlobalRead%s"%tc]: kStr += inst("s_mov_b32", sgpr("Srd%s+2"%tc), hex(0), "set out-of-bound addr for performance evaluation only") - kStr += inst("s_mov_b32", sgpr("ShadowLimit%s+1"%tc), hex(0xffffffff), "set out-of-bound addr for performance evaluation only") + if noShadowLimitCodeInLoop == False: + kStr += inst("s_mov_b32", sgpr("ShadowLimit%s+1"%tc), hex(0xffffffff), "set out-of-bound addr for performance evaluation only") return kStr @@ -7736,32 +7745,34 @@ def incrementSrd(self, kernel, tP, incLower, incUpper, checkShadowLimitCopy=True incUpper, \ "gra SRD += inc(upper)" ) - # also have to move the boundary since we change the base - # so less buffers to the edge: - if self.use64bShadowLimit: - imod.addInst("s_sub_u32", \ - sgpr("ShadowLimit%s+0"%tc), \ - sgpr("ShadowLimit%s+0"%tc), \ - incLower, \ - "limit -= inc)") - imod.addInst("s_subb_u32", \ - sgpr("ShadowLimit%s+1"%tc), \ - sgpr("ShadowLimit%s+1"%tc), \ - incUpper, \ - "limit -= inc)" ) - if checkShadowLimitCopy: - imod.addInst("s_cmp_eq_u32", sgpr("ShadowLimit%s+1"%tc), 0, "are we within 2^32?") - if self.staggerU: - # staggerU case, need to restore BufferLimit when ShadowLimit goes to negative value - imod.addInst("s_cselect_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), "BufferLimit%s"%tc, "Move shadow to real if we are within 2^32") - else: - imod.addInst("s_cmov_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), "Move shadow to real if we are within 2^32") - else: - imod.addInst("s_sub_u32", \ - sgpr("Srd%s+2"%(tc)), \ - sgpr("Srd%s+2"%(tc)), \ - incLower, \ - "limit -= inc)" ) + 
noShadowLimitCodeInLoop = self.noShadowLimitCodeInLoopA if tc == "A" else self.noShadowLimitCodeInLoopB + if noShadowLimitCodeInLoop == False: + # also have to move the boundary since we change the base + # so less buffers to the edge: + if self.use64bShadowLimit: + imod.addInst("s_sub_u32", \ + sgpr("ShadowLimit%s+0"%tc), \ + sgpr("ShadowLimit%s+0"%tc), \ + incLower, \ + "limit -= inc)") + imod.addInst("s_subb_u32", \ + sgpr("ShadowLimit%s+1"%tc), \ + sgpr("ShadowLimit%s+1"%tc), \ + incUpper, \ + "limit -= inc)" ) + if checkShadowLimitCopy: + imod.addInst("s_cmp_eq_u32", sgpr("ShadowLimit%s+1"%tc), 0, "are we within 2^32?") + if self.staggerU: + # staggerU case, need to restore BufferLimit when ShadowLimit goes to negative value + imod.addInst("s_cselect_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), "BufferLimit%s"%tc, "Move shadow to real if we are within 2^32") + else: + imod.addInst("s_cmov_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), "Move shadow to real if we are within 2^32") + else: + imod.addInst("s_sub_u32", \ + sgpr("Srd%s+2"%(tc)), \ + sgpr("Srd%s+2"%(tc)), \ + incLower, \ + "limit -= inc)" ) return imod ############################################################################## @@ -8015,12 +8026,14 @@ def globalReadIncrementAB(self, kernel, loopIdx, prefetchIndex, incs=1): for tc in ('A','B'): incCodeA.addInst("s_mov_b32", sgpr("Srd%s+0"%tc), sgpr("InitialSrd%sBase+0"%tc), "restore base") incCodeA.addInst("s_mov_b32", sgpr("Srd%s+1"%tc), sgpr("InitialSrd%sBase+1"%tc), "restore base") - if self.use64bShadowLimit: - incCodeA.addInst("s_mov_b32", sgpr("ShadowLimit%s+0"%tc), sgpr("InitialSrd%sLimit+0"%tc), "restore shadow limit") - incCodeA.addInst("s_mov_b32", sgpr("ShadowLimit%s+1"%tc), sgpr("InitialSrd%sLimit+1"%tc), "restore shadow limit") - assert(0) # not tested, would maybe need to restore base too if limit 0 - else: - incCodeA.addInst("s_mov_b32", sgpr("Srd%s+2"%tc), sgpr("InitialSrd%sLimit"%tc), "restore limit") + 
noShadowLimitCodeInLoop = self.noShadowLimitCodeInLoopA if tc == "A" else self.noShadowLimitCodeInLoopB + if noShadowLimitCodeInLoop == False: + if self.use64bShadowLimit: + incCodeA.addInst("s_mov_b32", sgpr("ShadowLimit%s+0"%tc), sgpr("InitialSrd%sLimit+0"%tc), "restore shadow limit") + incCodeA.addInst("s_mov_b32", sgpr("ShadowLimit%s+1"%tc), sgpr("InitialSrd%sLimit+1"%tc), "restore shadow limit") + assert(0) # not tested, would maybe need to restore base too if limit 0 + else: + incCodeA.addInst("s_mov_b32", sgpr("Srd%s+2"%tc), sgpr("InitialSrd%sLimit"%tc), "restore limit") # TODO - this skips over the stagger-u wrap codes @@ -15074,8 +15087,10 @@ def openPrefetchAcrossPersistent(self, kernel, isOptNLL, useBufferOOB=False): # reseting SrdA/B, ShadowLimitA/B, GlobalReadIncsA/B is more efficiently way than using BufferOOB imod.addInst("s_cmov_b32", sgpr("SrdA+2"), 0, "Set SrdA+2 to 0 for outside legal WG") imod.addInst("s_cmov_b32", sgpr("SrdB+2"), 0, "Set SrdB+2 to 0 for outside legal WG") - imod.addInst("s_cmov_b64", sgpr("ShadowLimitA", 2), 0, "Set ShadowLimitA to 0 for outside legal WG") - imod.addInst("s_cmov_b64", sgpr("ShadowLimitB", 2), 0, "Set ShadowLimitB to 0 for outside legal WG") + if self.noShadowLimitCodeInLoopA == False: + imod.addInst("s_cmov_b64", sgpr("ShadowLimitA", 2), 0, "Set ShadowLimitA to 0 for outside legal WG") + if self.noShadowLimitCodeInLoopB == False: + imod.addInst("s_cmov_b64", sgpr("ShadowLimitB", 2), 0, "Set ShadowLimitB to 0 for outside legal WG") imod.addInst("s_cmov_b32", sgpr("GlobalReadIncsA"), 0, "Stop decrementing ShadowLimitA and incrementing SrdA for outside legal WG") imod.addInst("s_cmov_b32", sgpr("GlobalReadIncsB"), 0, "Stop decrementing ShadowLimitB and incrementing SrdB for outside legal WG") else: From c1fa5b358d8cbe601754ef5ea4b695d895a34f62 Mon Sep 17 00:00:00 2001 From: Torre Zuk <42548444+TorreZuk@users.noreply.github.com> Date: Tue, 28 Nov 2023 09:02:43 -0700 Subject: [PATCH 07/51] fix for newer windows 
vcpkg msgpack (#1827) --- Tensile/Source/lib/CMakeLists.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Tensile/Source/lib/CMakeLists.txt b/Tensile/Source/lib/CMakeLists.txt index f8cc527c8..d3f4b697f 100644 --- a/Tensile/Source/lib/CMakeLists.txt +++ b/Tensile/Source/lib/CMakeLists.txt @@ -98,7 +98,7 @@ if(TENSILE_USE_LLVM OR TENSILE_USE_MSGPACK) endif() if(TENSILE_USE_MSGPACK) - find_package(msgpack REQUIRED) + find_package(msgpack REQUIRED NAMES msgpack msgpack-c) target_compile_definitions(TensileHost PUBLIC -DTENSILE_MSGPACK=1) if(TARGET msgpackc-cxx) From 2591802c75306f7c342c208126406cdc464e1511 Mon Sep 17 00:00:00 2001 From: Feroz Date: Tue, 28 Nov 2023 13:42:14 -0600 Subject: [PATCH 08/51] Disable HW monitor for aquvavanjaram941 (#1830) --- Tensile/Common.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/Tensile/Common.py b/Tensile/Common.py index 9baa3dccd..0aba6f5ac 100644 --- a/Tensile/Common.py +++ b/Tensile/Common.py @@ -2222,9 +2222,9 @@ def assignGlobalParameters( config ): if os.name == "nt": globalParameters["CurrentISA"] = (9,0,6) printWarning("Failed to detect ISA so forcing (gfx906) on windows") - if globalParameters["CurrentISA"] == (9,4,2) or globalParameters["CurrentISA"] == (11,0,0) or \ + if globalParameters["CurrentISA"] == (9,4,1) or globalParameters["CurrentISA"] == (9,4,2) or globalParameters["CurrentISA"] == (11,0,0) or \ globalParameters["CurrentISA"] == (11,0,1) or globalParameters["CurrentISA"] == (11,0,2): - printWarning("HardwareMonitor currently disabled for gfx942 or gfx1100/gfx1101/gfx1102") + printWarning("HardwareMonitor currently disabled for gfx941/942 or gfx1100/gfx1101/gfx1102") globalParameters["HardwareMonitor"] = False # For ubuntu platforms, call dpkg to grep the version of hip-clang. 
This check is platform specific, and in the future From c998961061438d11f703c47928837c7ac0a92405 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Fri, 1 Dec 2023 07:56:21 +0900 Subject: [PATCH 09/51] CI: Increase timeout for extended test (#1834) --- .jenkins/extended.groovy | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.jenkins/extended.groovy b/.jenkins/extended.groovy index 44ad373be..84a944414 100644 --- a/.jenkins/extended.groovy +++ b/.jenkins/extended.groovy @@ -45,7 +45,7 @@ def runCI = boolean formatCheck = false - prj.timeout.test = 600 + prj.timeout.test = 720 prj.defaults.ccache = false def commonGroovy From 9071c143c756c3cafa4c71f99d15b37e4b48373b Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Thu, 30 Nov 2023 16:24:44 -0700 Subject: [PATCH 10/51] Clean up old unused code, mostly related to old client (#1828) --- Tensile/BenchmarkStructs.py | 15 +- Tensile/CSVReader.py | 39 -- Tensile/ClientWriter.py | 1051 +------------------------------ Tensile/Code.py | 24 +- Tensile/Source/TensileTypes.h | 4 +- Tensile/Tensile.py | 31 +- Tensile/TensileCreateLibrary.py | 140 +--- setup.py | 9 +- 8 files changed, 10 insertions(+), 1303 deletions(-) delete mode 100644 Tensile/CSVReader.py diff --git a/Tensile/BenchmarkStructs.py b/Tensile/BenchmarkStructs.py index aad6e6b71..43a587531 100644 --- a/Tensile/BenchmarkStructs.py +++ b/Tensile/BenchmarkStructs.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2016-2022 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2016-2023 Advanced Micro Devices, Inc. All rights reserved. 
# # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -24,24 +24,13 @@ from copy import deepcopy import itertools -from .Common import print1, print2, hasParam, printExit, \ +from .Common import print1, print2, printExit, \ defaultBenchmarkCommonParameters, validParameters, globalParameters, \ defaultBatchedBenchmarkFinalProblemSizes, defaultBenchmarkFinalProblemSizes from .CustomKernels import getAllCustomKernelNames from .SolutionStructs import ProblemType, ProblemSizes -def getDefaultsForMissingParameters(paramList, defaultParams): - """Returns all parameters (with values) in defaultParams not present in paramList""" - benchmarkParams = {} - for paramDict in defaultParams: - for name, value in paramDict.items(): - if not hasParam(name, paramList) \ - or name == "ProblemSizes": - benchmarkParams[name] = value - return benchmarkParams - - def checkParametersAreValid(param, validParams): """Ensures paramaters in params exist and have valid values as specified by validParames""" (name, values) = param diff --git a/Tensile/CSVReader.py b/Tensile/CSVReader.py deleted file mode 100644 index 074805faa..000000000 --- a/Tensile/CSVReader.py +++ /dev/null @@ -1,39 +0,0 @@ -################################################################################ -# -# Copyright (C) 2016-2022 Advanced Micro Devices, Inc. All rights reserved. 
-# -# Permission is hereby granted, free of charge, to any person obtaining a copy -# of this software and associated documentation files (the "Software"), to deal -# in the Software without restriction, including without limitation the rights -# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell -# copies of the Software, and to permit persons to whom the Software is -# furnished to do so, subject to the following conditions: -# -# The above copyright notice and this permission notice shall be included in -# all copies or substantial portions of the Software. -# -# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR -# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, -# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE -# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER -# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, -# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE -# SOFTWARE. -# -################################################################################ - -from .Common import printExit -import csv - -def readCSV(csvFileName): - csvData = None - try: - with open(csvFileName, "r") as selectionfFile: - csvFile = csv.reader(selectionfFile) - csvData = list(csvFile) - except IOError: - printExit("Can't open \"%s\" to get data" % csvFileName) - - return csvData - - diff --git a/Tensile/ClientWriter.py b/Tensile/ClientWriter.py index 7ac7d50ef..49f8a2461 100644 --- a/Tensile/ClientWriter.py +++ b/Tensile/ClientWriter.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2016-2022 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2016-2023 Advanced Micro Devices, Inc. All rights reserved. 
# # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -25,7 +25,7 @@ from . import ClientExecutable from . import Common from . import LibraryIO -from .Common import globalParameters, pushWorkingPath, popWorkingPath, print1, printExit, CHeader, printWarning, listToInitializer, ClientExecutionLock +from .Common import globalParameters, pushWorkingPath, popWorkingPath, print1, printExit, printWarning, ClientExecutionLock from .SolutionStructs import ProblemType, ProblemSizesMock from .TensileCreateLibrary import copyStaticFiles @@ -208,20 +208,6 @@ def getBuildClientLibraryScript(buildPath, libraryLogicPath): return callCreateLibraryCmd -def writeBuildClientLibraryScript(path, libraryLogicPath): - filename = os.path.join(path, "build.%s" % ("bat" if os.name == "nt" else "sh") ) - with open(filename, "w") as file: - file.write("#!/bin/bash\n\n") - file.write("set -ex\n") - for item in getBuildClientLibraryScript(path, libraryLogicPath): - file.write(f"{item} ") - - if os.name != "nt": - os.chmod(filename, 0o777) - - return filename - - def writeRunScript(path, forBenchmark, enableTileSelection, configPaths=None): if configPaths is None: configPaths = [] @@ -274,38 +260,6 @@ def writeRunScript(path, forBenchmark, enableTileSelection, configPaths=None): return runScriptName -def toCppBool(yamlBool): - return "true" if yamlBool else "false" - -def getMaxSolutionSizes(solutions, solutionSummationSizes): - - maxK = max(solutionSummationSizes) - maxMT0 = 0 - maxMT1 = 0 - for solution in solutions: - - wg = solution["WorkGroup"] - tt = solution["ThreadTile"] - mt0 = wg[0] * tt[0] - mt1 = wg[1] * tt[1] - - if (mt0 > maxMT0): - maxMT0 = mt0 - - if (mt1 > maxMT1): - maxMT1 = mt1 - - return [maxMT0, maxMT1, maxK] - -def checkConstStride(constStrideMap, keyIdx): - finalVal = None - for (mapIdx, val) in constStrideMap: - if keyIdx == mapIdx: - finalVal = val - #print 
("idx=", keyIdx, "=", finalVal) - return finalVal - - def problemSizeParams(problemType, problem): numIndices = len(problemType.indices) @@ -556,1004 +510,3 @@ def CreateBenchmarkClientParametersForSizes(libraryRootPath, problemSizes, dataF writeClientConfigIni(problemSizes, problemType, libraryRootPath, codeObjectFiles, dataFilePath, configFile) - -################################################################################ -# Write Generated Benchmark Parameters -################################################################################ -def writeClientParameters(forBenchmark, solutions, problemSizes, stepName, \ - functionList, stepBaseDir, solutionSummationSizes, solutionWriter = None): - h = "" - - ############################################################################## - # Min Naming - ############################################################################## - """ - if forBenchmark: - kernels = [] - for solution in solutions: - solutionKernels = solution.getKernels() - for kernel in solutionKernels: - if kernel not in kernels: - kernels.append(kernel) - - solutionSerialNaming = Solution.getSerialNaming(solutions) - kernelSerialNaming = Solution.getSerialNaming(kernels) - solutionMinNaming = Solution.getMinNaming(solutions) - kernelMinNaming = Solution.getMinNaming(kernels) - solutionWriter = SolutionWriter( \ - solutionMinNaming, solutionSerialNaming, \ - kernelMinNaming, kernelSerialNaming) - """ - - if forBenchmark: - if globalParameters["MergeFiles"]: - h += "#include \"Solutions.h\"\n" - else: - for solution in solutions: - solutionName = solutionWriter.getSolutionName(solution) - h += "#include \"" + solutionName + ".h\"\n" - h += "#include \"Solutions.h\"\n" - h += "#include \"ReferenceCPU.h\"\n" - h += "\n" - else: - h += "#include \"Solutions.h\"\n" - h += "#include \"Tensile.h\"\n" - - - h += "typedef enum {\n" - h += " enum_float,\n" - h += " enum_double,\n" - h += " enum_TensileComplexFloat,\n" - h += " 
enum_TensileComplexDouble\n" - h += "#ifdef Tensile_ENABLE_HALF\n" - h += " ,enum_TensileHalf\n" - h += "#endif\n" - h += " ,enum_TensileInt8x4\n" - h += " ,enum_TensileInt32\n" - h += " ,enum_tensile_bfloat16\n" - h += "} DataTypeEnum;\n" - h += "\n" - - h += "// Debug Params\n" - h += "const unsigned printTensorA=%x;\n" % int(globalParameters["PrintTensorA"]) - h += "const unsigned printTensorB=%x;\n" % int(globalParameters["PrintTensorB"]) - h += "const unsigned printTensorC=%x;\n" % int(globalParameters["PrintTensorC"]) - h += "const unsigned printTensorD=%x;\n" % int(globalParameters["PrintTensorD"]) - - h += "const bool printWinnersOnly=%s;\n" % toCppBool(globalParameters["PrintWinnersOnly"]) - h += "\n" - - h += "const char indexChars[%u] = \"%s" \ - % (len(globalParameters["IndexChars"])+1, \ - globalParameters["IndexChars"][0]) - for i in range(1, len(globalParameters["IndexChars"])): - h += globalParameters["IndexChars"][i] - h += "\";\n" - - h += "unsigned int functionIdx;\n" - h += "unsigned int dataTypeIdx;\n" - h += "unsigned int problemTypeIdx;\n" - h += "\n" - - ############################################################################## - # Problem Types - ############################################################################## - #dataTypes = [] - #problemTypes = [] - #functionSerialToDataTypeAndIdx = [] - dataTypes = [] - problemTypes = [] - destDataTypes = {} - computeDataTypes = {} - problemTypesForDataType = {} # for data type - schedulesForProblemType = {} # for problem type - functionInfo = [] # dataTypeIdx, problemTypeIdx, idxWithinDataType, idxWithinProblemType - #tileSelection = False - - if forBenchmark: - problemType = solutions[0]["ProblemType"] - dataType = problemType["DataType"] - #tileSelection = problemType["TileAwareSelection"] - - destDataType = problemType["DestDataType"] - destDataTypes[dataType] = destDataType - - computeDataType = problemType["ComputeDataType"] - computeDataTypes[dataType] = computeDataType - - 
dataTypes.append(dataType) - - problemTypes.append(problemType) - problemTypesForDataType[dataType] = [problemType] - schedulesForProblemType[problemType] = solutions - numProblemTypes = 1 - for solution in solutions: - functionInfo.append([ 0, 0, 0, 0, 0, 0 ]) - else: - for functionIdx in range(0, len(functionList)): - function = functionList[functionIdx] - scheduleName = function[0] - problemType = function[1] - dataType = problemType["DataType"] - destDataType = problemType["DestDataType"] - computeDataType = problemType["ComputeDataType"] - if dataType not in dataTypes: - dataTypes.append(dataType) - destDataTypes[dataType] = destDataType - computeDataTypes[dataType] = computeDataType - problemTypesForDataType[dataType] = [] - if problemType not in problemTypesForDataType[dataType]: - problemTypesForDataType[dataType].append(problemType) - schedulesForProblemType[problemType] = [] - schedulesForProblemType[problemType].append(scheduleName) - - # sort - dataTypes = sorted(dataTypes) - for dataType in dataTypes: - problemTypesForDataType[dataType] = \ - sorted(problemTypesForDataType[dataType],key=str) - for problemType in problemTypesForDataType[dataType]: - schedulesForProblemType[problemType] = \ - sorted(schedulesForProblemType[problemType],key=str) - - # assign info - functionIdxSerial = 0 - problemTypeIdxSerial = 0 - for dataTypeIdxSerial in range(0, len(dataTypes)): - dataType = dataTypes[dataTypeIdxSerial] - functionIdxForDataType = 0 - for problemTypeIdxForDataType in range(0, \ - len(problemTypesForDataType[dataType])): - problemType = \ - problemTypesForDataType[dataType][problemTypeIdxForDataType] - problemTypes.append(problemType) - functionIdxForProblemType = 0 - for functionIdxForProblemType in range(0, \ - len(schedulesForProblemType[problemType])): - functionInfo.append([ \ - dataTypeIdxSerial, \ - problemTypeIdxForDataType, \ - problemTypeIdxSerial, \ - functionIdxSerial,\ - functionIdxForDataType,\ - functionIdxForProblemType, \ - ]) - 
functionIdxForProblemType += 1 - functionIdxForDataType += 1 - functionIdxSerial += 1 - problemTypeIdxSerial += 1 - numProblemTypes = problemTypeIdxSerial - numFunctions = functionIdxSerial - h += "const unsigned int numFunctions = %u;\n" % numFunctions - - ############################################################################## - # Data Types - ############################################################################## - h += "/* data types */\n" - numDataTypes = len(dataTypes) - h += "const unsigned int numDataTypes = %u;\n" % numDataTypes - h += "const DataTypeEnum dataTypeEnums[numDataTypes] = { enum_%s" \ - % dataTypes[0].toCpp() - for dataTypeIdx in range(1, numDataTypes): - h += ", enum_%s" % dataTypes[dataTypeIdx].toCpp() - h += " };\n" - # bytes per elements - h += "const unsigned int bytesPerElement[numDataTypes] = { %u" \ - % (dataTypes[0].numBytes()) - for dataTypeIdx in range(1, numDataTypes): - dataType = dataTypes[dataTypeIdx] - h += ", %u" % dataType.numBytes() - h += " };\n" - # flops per mac - if dataTypes[0].isInt8x4(): - h += "const unsigned int numFlopsPerMac[numDataTypes] = { %u" % (8 if dataTypes[0].isReal() else 32) - else: - h += "const unsigned int numFlopsPerMac[numDataTypes] = { %u" % (2 if dataTypes[0].isReal() else 8) - for dataTypeIdx in range(1, numDataTypes): - dataType = dataTypes[dataTypeIdx] - h += ", %u" % (2 if dataType.isReal() else 8) - h += " };\n" - for dataTypeIdx in range(0, numDataTypes): - h += "#define Tensile_DATA_TYPE_%s\n" \ - % dataTypes[dataTypeIdx].toCpp().upper() - - ############################################################################## - # Problem Types - ############################################################################## - h += "/* problem types */\n" - h += "const unsigned int numProblemTypes = %u;\n" % numProblemTypes - # Num C Indices - h += "const unsigned int numIndicesC[numProblemTypes] = { %u" \ - % problemTypes[0]["NumIndicesC"] - for problemTypeIdx in range(1, 
numProblemTypes): - problemType = problemTypes[problemTypeIdx] - h += ", %u" % problemType["NumIndicesC"] - h += " };\n" - - # Num AB Indices - maxNumIndicesA = len(problemTypes[0]["IndexAssignmentsA"]) - maxNumIndicesB = len(problemTypes[0]["IndexAssignmentsB"]) - h += "const unsigned int numIndicesA[numProblemTypes] = { %u" \ - % len(problemTypes[0]["IndexAssignmentsA"]) - for problemTypeIdx in range(1, numProblemTypes): - problemType = problemTypes[problemTypeIdx] - numIndicesA = len(problemType["IndexAssignmentsA"]) - h += ", %u" % numIndicesA - maxNumIndicesA = max(numIndicesA, maxNumIndicesA) - h += " };\n" - h += "const unsigned int maxNumIndicesA = %u;\n" % maxNumIndicesA - - h += "const unsigned int numIndicesB[numProblemTypes] = { %u" \ - % len(problemTypes[0]["IndexAssignmentsB"]) - for problemTypeIdx in range(1, numProblemTypes): - problemType = problemTypes[problemTypeIdx] - numIndicesB = len(problemType["IndexAssignmentsB"]) - h += ", %u" % numIndicesB - maxNumIndicesB = max(numIndicesB, maxNumIndicesB) - h += " };\n" - h += "const unsigned int maxNumIndicesB = %u;\n" % maxNumIndicesB - - # Index Assignments A - h += "const unsigned int indexAssignmentsA[numProblemTypes][maxNumIndicesA] = {\n" - for problemTypeIdx in range(0, numProblemTypes): - problemType = problemTypes[problemTypeIdx] - indices = problemType["IndexAssignmentsA"] - h += " { %u" % indices[0] - for i in range(1, maxNumIndicesA): - if i < len(indices): - h += ", %u" % indices[i] - else: - h += ", static_cast(-1)" - if problemTypeIdx < numProblemTypes-1: - h += " },\n" - else: - h += " }\n" - h += "};\n" - # Index Assignments B - h += "const unsigned int indexAssignmentsB[numProblemTypes][maxNumIndicesB] = {\n" - for problemTypeIdx in range(0, numProblemTypes): - problemType = problemTypes[problemTypeIdx] - indices = problemType["IndexAssignmentsB"] - h += " { %u" % indices[0] - for i in range(1, maxNumIndicesB): - if i < len(indices): - h += ", %u" % indices[i] - else: - h += ", 
static_cast(-1)" - if problemTypeIdx < numProblemTypes-1: - h += " },\n" - else: - h += " }\n" - h += "};\n" - # Index Assignments LD - h += "const unsigned int numIndicesLD = %u;\n" % problemType["NumIndicesLD"] - h += "const unsigned int indexAssignmentsLD[numIndicesLD] = {" - if problemType["NumIndicesLD"] > 0: - h += " %u" % problemType["IndexAssignmentsLD"][0] - for ldIdx in range(1, len(problemType["IndexAssignmentsLD"])): - h += ", %u" % problemType["IndexAssignmentsLD"][ldIdx] - h += "};\n" - # beta - h += "bool useBeta[numProblemTypes] = { %s" \ - % ("true" if problemTypes[0]["UseBeta"] else "false") - for problemTypeIdx in range(1, numProblemTypes): - problemType = problemTypes[problemTypeIdx] - h += ", %s" % ("true" if problemType["UseBeta"] else "false") - h += " };\n" - # Complex Conjugates - h += "const bool complexConjugateA[numProblemTypes] = { %s" \ - % ("true" if problemTypes[0]["ComplexConjugateA"] else "false" ) - for problemTypeIdx in range(1, numProblemTypes): - problemType = problemTypes[problemTypeIdx] - h += ", %s" % ("true" if problemTypes[0]["ComplexConjugateA"] else "false" ) - h += " };\n" - h += "const bool complexConjugateB[numProblemTypes] = { %s" \ - % ("true" if problemTypes[0]["ComplexConjugateB"] else "false" ) - for problemTypeIdx in range(1, numProblemTypes): - problemType = problemTypes[problemTypeIdx] - h += ", %s" % ("true" if problemTypes[0]["ComplexConjugateB"] else "false" ) - h += " };\n" - h += "\n" - - if not forBenchmark: - h += "// dataTypeIdxSerial, problemTypeIdxForDataType, problemTypeIdxSerial, functionIdxSerial, functionIdxForDataType, functionIdxForProblemType\n" - first = True - h += "const unsigned int functionInfo[numFunctions][6] = {\n" - for info in functionInfo: - h += "%s{ %u, %u, %u, %u, %u, %u }" % (" " if first else ",\n ", \ - info[0], info[1], info[2], info[3], info[4], info[5] ) - first = False - h += " };\n" - - - ############################################################################## - # 
Problem Sizes - ############################################################################## - maxNumIndices = problemTypes[0]["TotalIndices"] - if not forBenchmark: - for problemType in problemTypes: - maxNumIndices = max(problemType["TotalIndices"], maxNumIndices) - h += "const unsigned int maxNumIndices = %u;\n" % maxNumIndices - h += "const unsigned int totalIndices[numProblemTypes] = { %u" \ - % problemTypes[0]["TotalIndices"] - for problemTypeIdx in range(1, numProblemTypes): - h += ", %u" % problemTypes[problemTypeIdx]["TotalIndices"] - h += " };\n" - if forBenchmark: - h += "const unsigned int numProblems = %u;\n" \ - % problemSizes.totalProblemSizes - h += "const unsigned int problemSizes[numProblems][%u] = {\n" \ - % (problemTypes[0]["TotalIndices"] + problemType["NumIndicesLD"]) - for i in range(problemSizes.totalProblemSizes): - #assert problemSizes.problems[i].stridesA == None # new stride functionality only supported on new client, not here - problemSize = problemSizes.problems[i].sizes - line = " {%5u" %problemSize[0] - for j in range(1, problemTypes[0]["TotalIndices"] + problemType["NumIndicesLD"]): - line += ",%5u" % problemSize[j] - line += " }" - h += line - if i < problemSizes.totalProblemSizes-1: - h += "," - else: - h += "" - h += "};\n" - h += "const unsigned int minStrides[%u] = {" \ - % problemTypes[0]["TotalIndices"] - for i in range(0, len(problemSizes.minStrides)): - if (i!=0): - h += ", " - h += str(problemSizes.minStrides[i]) - h += "};\n" - else: - h += "unsigned int userSizes[maxNumIndices];\n" - h += "unsigned int minStrides[%u] = {" \ - % maxNumIndices - for i in range(0, maxNumIndices): - if (i!=0): - h += ", " - h += str(0); # always use 0 for minStrides in benchmark mode - h += "};\n" - - if forBenchmark: - h += "/* problem sizes */\n" - """ - h += "const bool indexIsSized[maxNumIndices] = {" - for i in range(0, problemSizes.totalIndices): - h += " %s" % ("true" if problemSizes.indexIsSized[i] else "false") - if i < 
problemSizes.totalIndices-1: - h += "," - h += " };\n" - - h += "const unsigned int numIndicesSized = %u;\n" \ - % len(problemSizes.indicesSized) - h += "const unsigned int indicesSized[numIndicesSized][4] = {\n" - h += "// { min, stride, stride_incr, max }\n" - for i in range(0, len(problemSizes.indicesSized)): - r = problemSizes.indicesSized[i] - h += " { %u, %u, %u, %u }" % (r[0], r[1], r[2], r[3]) - if i < len(problemSizes.indicesSized)-1: - h += "," - h += "\n" - h += " };\n" - - numIndicesMapped = len(problemSizes.indicesMapped) - h += "const unsigned int numIndicesMapped = %u;\n" % numIndicesMapped - if numIndicesMapped > 0: - h += "#define Tensile_INDICES_MAPPED 1\n" - h += "const unsigned int indicesMapped[numIndicesMapped] = {" - for i in range(0, numIndicesMapped): - h += " %u" % problemSizes.indicesMapped[i] - if i < numIndicesMapped-1: - h += "," - h += " };\n" - else: - h += "#define Tensile_INDICES_MAPPED 0\n" - """ - - ############################################################################## - # Max Problem Sizes - ############################################################################## - if forBenchmark: - maximumD = problemSizes.maxD - maximumC = problemSizes.maxC - maximumA = problemSizes.maxA - maximumB = problemSizes.maxB - maximumW = problemSizes.maxD * 32; - - maxMT = getMaxSolutionSizes(solutions, solutionSummationSizes) - - maxMN = 1296 * maxMT[0] * maxMT[1] - maxMK = 36 * maxMT[0] * maxMT[2] - maxNK = 36 * maxMT[1] * maxMT[2] - - maximumA = max(maximumA, maxMK) - maximumB = max(maximumB, maxNK) - maximumC = max(maximumC, maxMN) - maximumD = max(maximumD, maxMN) - maximumW = max(maximumW, maxMN) - - h += "size_t maxSizeD = %u;\n" % (maximumD) - h += "size_t maxSizeC = %u;\n" % (maximumC) - h += "size_t maxSizeA = %u;\n" % (maximumA) - h += "size_t maxSizeB = %u;\n" % (maximumB) - h += "size_t maxSizeW = %u;\n" % (maximumW) - h += "\n" - else: - h += "size_t maxSizeD;\n" - h += "size_t maxSizeC;\n" - h += "size_t maxSizeA;\n" - h 
+= "size_t maxSizeB;\n" - h += "size_t maxSizeW;\n" - h += "\n" - - ############################################################################## - # Current Problem Size - ############################################################################## - h += "/* current problem size */\n" - #h += "unsigned int fullSizes[maxNumIndices];\n" - #h += "unsigned int currentSizedIndexSizes[numIndicesSized];\n" - #h += "unsigned int currentSizedIndexIncrements[numIndicesSized];\n" - h += "\n" - - ############################################################################## - # Solutions - ############################################################################## - if forBenchmark: - # Solution Ptrs - h += "/* solutions */\n" - # Problem Type Indices - h += "const unsigned int maxNumSolutions = %u;\n" % len(solutions) - h += "float solutionPerf[numProblems][maxNumSolutions]; // milliseconds\n" - h += "\n" - - h += "static const SolutionInfo solutions[maxNumSolutions] = {\n" - for i in range(0, len(solutions)): - solution = solutions[i] - solutionName = solutionWriter.getSolutionName(solution) - h += " {(void*)%s, \"%s\", {%d, %d, %d, %d, %s, %d, %d} }" % \ - (solutionName, solutionName, - solution["AssertSummationElementMultiple"], - solution["AssertFree0ElementMultiple"], - solution["AssertFree1ElementMultiple"], - solution["AssertMinApproxSize"], - "false", - solution["PackBatchDims"]==2, \ - solution["PackBatchDims"]==1, \ - ) - if i < len(solutions)-1: - h += "," - h += "\n" - h += " };\n" - h += "\n" - - numSummations = len(solutionSummationSizes) - h += "const unsigned int numSummations = %d;\n" % (numSummations) - - h += "const unsigned int summations[numSummations] = {%d" % (solutionSummationSizes[0]) - for i in range(1, numSummations): - h += ", %d" % (solutionSummationSizes[i]) - h += "};\n" - - ############################################################################## - # Solution meta data - 
############################################################################## - - transA = solutions[0]["ProblemType"]["TransposeA"] - transB = solutions[0]["ProblemType"]["TransposeB"] - h += "const unsigned int solutionMetaData[maxNumSolutions][10] = {\n" - for i in range(0, len(solutions)): - solution = solutions[i] - - wg = solution["WorkGroup"] - tt = solution["ThreadTile"] - mt0 = wg[0] * tt[0] - mt1 = wg[1] * tt[1] - gsu = solution["GlobalSplitU"] - lsu = wg[2] - - h += " {%d, %d, %d, %d, %d, %d, %d, %d, %d, %d}" % (mt0,mt1,tt[0],tt[1],wg[0],wg[1],transA,transB,gsu,lsu) - - if (i < len(solutions) - 1): - h += ",\n" - else: - h += "\n" - h += " };\n" - h += "\n" - - - - else: - # Function Names - functionNames = [] - for dataType in dataTypes: - for problemType in problemTypesForDataType[dataType]: - # example scheduleName is fiji, vega10, etc - for scheduleName in schedulesForProblemType[problemType]: - functionNames.append("tensile_%s" % (problemType)) - h += "const char *functionNames[numFunctions] = {\n" - for functionIdx in range(0, len(functionNames)): - functionName = functionNames[functionIdx] - h += " \"%s\"%s\n" % (functionName, \ - "," if functionIdx < len(functionNames)-1 else "" ) - h += " };\n" - - ############################################################################## - # Runtime Structures - ############################################################################## - h += "/* runtime structures */\n" - h += "TensileStatus status;\n" - if globalParameters["RuntimeLanguage"] == "OCL": - h += "cl_platform_id platform;\n" - h += "cl_device_id device;\n" - h += "cl_context context;\n" - h += "cl_command_queue stream;\n" - else: - h += "hipStream_t stream;\n" - #h += "int deviceIdx = %u;\n" \ - # % (globalParameters["Device"]) - h += "\n" - h += "void *deviceWS;\n" - h += "void *deviceD;\n" - h += "void *deviceC;\n" - h += "void *deviceA;\n" - h += "void *deviceB;\n" - - 
############################################################################## - # Benchmarking and Validation Parameters - ############################################################################## - h += "\n/* benchmarking parameters */\n" - #h += "const bool measureKernelTime = %s;\n" \ - # % ("true" if globalParameters["KernelTime"] else "false") - #h += "const unsigned int numEnqueuesPerSync = %u;\n" \ - # % (globalParameters["EnqueuesPerSync"]) - #h += "const unsigned int numSyncsPerBenchmark = %u;\n" \ - # % (globalParameters["SyncsPerBenchmark"]) - #h += "unsigned int numElementsToValidate = %s;\n" \ - # % (str(globalParameters["NumElementsToValidate"]) \ - # if globalParameters["NumElementsToValidate"] >= 0 \ - # else "0xFFFFFFFF" ) - #h += "unsigned int validationMaxToPrint = %u;\n" \ - # % globalParameters["ValidationMaxToPrint"] - #h += "bool validationPrintValids = %s;\n" \ - # % ("true" if globalParameters["ValidationPrintValids"] else "false") - h += "size_t validationStride;\n" - if problemType["HighPrecisionAccumulate"]: - h += "static bool useHighPrecisionAccumulate = true;\n" - else: - h += "static bool useHighPrecisionAccumulate = false;\n" - #h += "unsigned int dataInitTypeC = %s;\n" % globalParameters["DataInitTypeC"] - #h += "unsigned int dataInitTypeAB = %s;\n" % globalParameters["DataInitTypeAB"] - h += "\n" - - ############################################################################## - # Generated Call to Reference - ############################################################################## - h += "/* generated call to reference */\n" - h += "template\n" - h += "TensileStatus generatedCallToReferenceCPU(\n" - h += " const unsigned int *sizes,\n" - h += " const unsigned int *minStrides,\n" - h += " DestDataType *referenceD,\n" - h += " DestDataType *referenceC,\n" - h += " DataType *initialA,\n" - h += " DataType *initialB,\n" - h += " const unsigned int lda,\n" - h += " const unsigned int ldb,\n" - h += " const unsigned int 
ldc,\n" - h += " const unsigned int ldd,\n" - h += " const unsigned int stride_a,\n" - h += " const unsigned int stride_b,\n" - h += " const unsigned int stride_c,\n" - h += " const unsigned int stride_d,\n" - h += " ComputeDataType alpha,\n" - h += " ComputeDataType beta,\n" - h += " bool useHighPrecisionAccumulate) {\n" - h += " return tensileReferenceCPU(\n" - h += " referenceD,\n" - h += " referenceC,\n" - h += " initialA,\n" - h += " initialB,\n" - h += " lda,\n" - h += " ldb,\n" - h += " ldc,\n" - h += " ldd,\n" - h += " stride_a,\n" - h += " stride_b,\n" - h += " stride_c,\n" - h += " stride_d,\n" - h += " alpha,\n" - h += " beta,\n" - h += " totalIndices[problemTypeIdx],\n" - h += " sizes,\n" - h += " minStrides,\n" - h += " numIndicesC[problemTypeIdx],\n" - h += " numIndicesA[problemTypeIdx],\n" - h += " numIndicesB[problemTypeIdx],\n" - h += " indexAssignmentsA[problemTypeIdx],\n" - h += " indexAssignmentsB[problemTypeIdx],\n" - h += " complexConjugateA[problemTypeIdx],\n" - h += " complexConjugateB[problemTypeIdx],\n" - h += " validationStride,\n" - h += " useHighPrecisionAccumulate);\n" - h += "};\n" - h += "\n" - - ############################################################################## - # Generated Call to Solution - ############################################################################## - if forBenchmark: - problemType = solutions[0]["ProblemType"] - h += "/* generated call to solution */\n" - h += "template\n" - h += "TensileStatus generatedCallToSolution(\n" - h += " const SolutionInfoType &solution,\n" - h += " SolutionLock *solutionLock,\n" - h += " const unsigned int *sizes,\n" - h += " const unsigned int *minStrides,\n" - h += " const unsigned int lda,\n" - h += " const unsigned int ldb,\n" - h += " const unsigned int ldc,\n" - h += " const unsigned int ldd,\n" - h += " const unsigned int stride_a,\n" - h += " const unsigned int stride_b,\n" - h += " const unsigned int stride_c,\n" - h += " const unsigned int stride_d,\n" - h += " 
ComputeDataType alpha,\n" - h += " ComputeDataType beta,\n" - h += " unsigned int numEvents = 0,\n" - if globalParameters["RuntimeLanguage"] == "OCL": - h += " cl_event *event_wait_list = NULL,\n" - h += " cl_event *outputEvent = NULL ) {\n" - else: - h += " hipEvent_t *startEvent = NULL,\n" - h += " hipEvent_t *stopEvent = NULL ) {\n" - - h += " // calculate parameters assuming packed data\n" - # strides - indexChars = globalParameters["IndexChars"] - firstStride = 1 - #assert(not problemType["UseInitialStridesCD"]) # not supported in old client - if problemType["UseInitialStridesAB"]: - firstStride = 0 - lastStrideD = problemType["NumIndicesC"] - lastStrideC = problemType["NumIndicesC"] - lastStrideA = len(problemType["IndexAssignmentsA"]) - lastStrideB = len(problemType["IndexAssignmentsB"]) - - # calculate strides - for i in range(0,lastStrideD): - h += " unsigned int strideD%u%s = 1" % (i, indexChars[i]) - for j in range(0, i): - h += " * (" - if j == 0: - h += "(ldd != std::numeric_limits::max()) ? ldd : " - h += "std::max(minStrides[%i], sizes[%i]))" % (j,j) - h += ";\n" - h += " if (stride_d != std::numeric_limits::max()) strideD%u%s = stride_d;\n" % (lastStrideD-1, indexChars[lastStrideD-1]) - for i in range(0,lastStrideC): - h += " unsigned int strideC%u%s = 1 " % (i, indexChars[i]) - for j in range(0, i): - h += " * (" - if j == 0: - h += "(ldc != std::numeric_limits::max()) ? 
ldc : " - h+= "std::max(minStrides[%i], sizes[%i]))" % (j,j) - h += ";\n" - h += " if (stride_c != std::numeric_limits::max()) strideC%u%s = stride_c;\n" % (lastStrideC-1, indexChars[lastStrideC-1]) - - constStride = None - for i in range(0,lastStrideA): - idx = problemType["IndexAssignmentsA"][i] - constStride = checkConstStride(problemType["SetConstStrideA"], idx) - if constStride != None: - h += " unsigned int strideA%u%s = %d; //SetConstStrideA\n" % (i, - indexChars[problemType["IndexAssignmentsA"][i]], - constStride) - else: - h += " unsigned int strideA%u%s = 1" % (i, \ - indexChars[problemType["IndexAssignmentsA"][i]]) - for j in range(0, i): - h += " * (" - if j == 0: - h += "(lda != std::numeric_limits::max()) ? lda : " - h += "std::max(minStrides[%i], sizes[%i]))" % \ - (problemType["IndexAssignmentsA"][j], - problemType["IndexAssignmentsA"][j]) - h += ";\n" - if constStride == None: - h += " if (stride_a != std::numeric_limits::max()) strideA%u%s = stride_a;\n" % (lastStrideA-1, indexChars[problemType["IndexAssignmentsA"][lastStrideA-1]]) - - for i in range(0,lastStrideB): - idx = problemType["IndexAssignmentsB"][i] - constStride = checkConstStride(problemType["SetConstStrideB"], idx) - if constStride != None: - h += " unsigned int strideB%u%s = %d; //SetConstStrideB\n" % (i, - indexChars[problemType["IndexAssignmentsB"][i]], - constStride) - else: - h += " unsigned int strideB%u%s = 1" % (i, \ - indexChars[problemType["IndexAssignmentsB"][i]]) - for j in range(0, i): - h += " * (" - if j == 0: - h += "(ldb != std::numeric_limits::max()) ? 
ldb : " - h+= "std::max(minStrides[%i], sizes[%i]))" % \ - (problemType["IndexAssignmentsB"][j], - problemType["IndexAssignmentsB"][j]) - h += ";\n" - h += " if (stride_b != std::numeric_limits::max()) strideB%u%s = stride_b;\n" % (lastStrideB-1, indexChars[problemType["IndexAssignmentsB"][lastStrideB-1]]) - - for i in range(0, problemType["TotalIndices"]): - h += " unsigned int size%s = sizes[%u];\n" % (indexChars[i], i) - h += "\n" - - - # function call - h += " // Check assertions,\n" - assert(not problemType["UseInitialStridesCD"]) # not supported in old client - firstStride = 0 if problemType["UseInitialStridesAB"] else 1 - lastStrideD = problemType["NumIndicesC"] - lastStrideC = problemType["NumIndicesC"] - lastStrideA = len(problemType["IndexAssignmentsA"]) - lastStrideB = len(problemType["IndexAssignmentsB"]) - numSizes = problemType["TotalIndices"] - h += " typedef ProblemDims<%u,%u,%u,%u,%u,%u> ProblemDims_%s;\n" \ - % (firstStride, lastStrideD, lastStrideC, lastStrideA, lastStrideB, numSizes, problemType) - # TODO - this should be initialized somewhere once? 
- h += " static const ProblemType problemType( " - h += listToInitializer(problemType["IndicesFree"]) + ", " - h += listToInitializer(problemType["IndicesSummation"]) + ", " - h += listToInitializer(problemType["IndicesBatch"]) + ', ' - h += listToInitializer(problemType["IndexAssignmentsA"]) + ', ' - h += listToInitializer(problemType["IndexAssignmentsB"]) - h += ");\n" - # create problem size - TODO could move this up to the caller - h += " ProblemDims_%s pdims(" % problemType - indexChars = globalParameters["IndexChars"] - for i in range(firstStride,lastStrideD): - if i != firstStride: h += ", " - h += "strideD%u%s" % (i, indexChars[i]) - for i in range(firstStride,lastStrideC): - h += ", strideC%u%s" % (i, indexChars[i]) - for i in range(firstStride,lastStrideA): - h += ", strideA%u%s" % (i, \ - indexChars[problemType["IndexAssignmentsA"][i]]) - for i in range(firstStride,lastStrideB): - h += ", strideB%u%s" % (i, \ - indexChars[problemType["IndexAssignmentsB"][i]]) - for i in range(0, problemType["TotalIndices"]): - h += ", size%s" % indexChars[i] - h += ");\n" - h += " if (!ProblemProperties(pdims,&problemType).validForSolution(solution._assertionRequirements))\n" - h += " return tensileStatusAssertFailure; // problem dims did not meet requirements for solution\n" - h += "\n" - - h += " // call solution function\n" - h += " TensileSolutionPointer_%s f = reinterpret_cast (solution._functionPtr);\n" \ - % (problemType, problemType) - if globalParameters["RuntimeLanguage"] == "OCL": - h += " return f(solutionLock, static_cast(deviceD), static_cast(deviceC), static_cast(deviceA), static_cast(deviceB),\n" - else: - typeName = dataTypes[0].toCpp() - destTypeName = destDataTypes[dataType].toCpp() - computeTypeName = computeDataTypes[dataType].toCpp() - h += " return f(solutionLock,\n" - h += " static_cast<%s *>(deviceD),\n" % destTypeName - h += " static_cast<%s *>(deviceC),\n" % destTypeName - h += " static_cast<%s *>(deviceA),\n" % typeName - h += " static_cast<%s 
*>(deviceB),\n" % typeName - h += " alpha,\n" - if problemType["UseBeta"]: - h += " beta,\n" - for i in range(firstStride,lastStrideD): - h += " strideD%u%s,\n" % (i, indexChars[i]) - for i in range(firstStride,lastStrideC): - h += " strideC%u%s,\n" % (i, indexChars[i]) - for i in range(firstStride,lastStrideA): - h += " strideA%u%s,\n" % (i, \ - indexChars[problemType["IndexAssignmentsA"][i]]) - for i in range(firstStride,lastStrideB): - h += " strideB%u%s,\n" % (i, \ - indexChars[problemType["IndexAssignmentsB"][i]]) - for i in range(0, problemType["TotalIndices"]): - h += " size%s,\n" % indexChars[i] - h += " stream,\n" - if globalParameters["RuntimeLanguage"] == "OCL": - h += " numEvents, event_wait_list, outputEvent ); // events\n" - else: - h += " numEvents,\n" - h += " startEvent,\n" - h += " stopEvent,\n" - h += " static_cast(deviceWS)); // events\n" - - h += "};\n" - h += "\n" - else: - ############################################################################ - # Generated Call to Function - ############################################################################ - for enqueue in [True, False]: - functionName = "tensile" if enqueue else "tensileGetSolutionName" - returnName = "TensileStatus" if enqueue else "const char *" - h += "/* generated call to function */\n" - h += "template\n" - h += "%s generatedCallTo_%s(\n" % (returnName, functionName) - h += " unsigned int *sizes,\n" - h += " unsigned int *minStrides,\n" - h += " ComputeDataType alpha,\n" - h += " ComputeDataType beta,\n" - h += " unsigned int lda,\n" - h += " unsigned int ldb,\n" - h += " unsigned int ldc,\n" - h += " unsigned int ldd,\n" - h += " unsigned int strideA,\n" - h += " unsigned int strideB,\n" - h += " unsigned int strideC,\n" - h += " unsigned int strideD,\n" - h += " unsigned int numEvents = 0,\n" - - if globalParameters["RuntimeLanguage"] == "OCL": - h += " cl_event *event_wait_list = NULL,\n" - h += " cl_event *outputEvent = NULL );\n\n" - else: - h += " hipEvent_t 
*startEvent = NULL,\n" - h += " hipEvent_t *stopEvent = NULL );\n\n" - - -#need to get DestDataType in here - for dataType in dataTypes: - typeName = dataType.toCpp() - destDataType = destDataTypes[dataType] - destTypeName = destDataType.toCpp() - computeDataType = computeDataTypes[dataType] - computeTypeName = computeDataType.toCpp() - functionsForDataType = [] - for problemType in problemTypesForDataType[dataType]: - for scheduleName in schedulesForProblemType[problemType]: - functionsForDataType.append([scheduleName, problemType]) - h += "template<>\n" - h += "inline %s generatedCallTo_%s<%s, %s, %s>(\n" \ - % (returnName, functionName, typeName, destTypeName, computeTypeName) - h += " unsigned int *sizes,\n" - h += " unsigned int *minStrides,\n" - h += " %s alpha,\n" % computeTypeName - h += " %s beta,\n" % computeTypeName - h += " unsigned int lda,\n" - h += " unsigned int ldb,\n" - h += " unsigned int ldc,\n" - h += " unsigned int ldd,\n" - h += " unsigned int strideA,\n" - h += " unsigned int strideB,\n" - h += " unsigned int strideC,\n" - h += " unsigned int strideD,\n" - h += " unsigned int numEvents, \n" - - if globalParameters["RuntimeLanguage"] == "OCL": - h += " cl_event *event_wait_list,\n" - h += " cl_event *outputEvent ) {\n\n" - else: - h += " hipEvent_t *startEvent,\n" - h += " hipEvent_t *stopEvent ) {\n\n" - - h += " unsigned int functionIdxForDataType = functionInfo[functionIdx][4];\n" - - for functionIdx in range(0, len(list(functionsForDataType))): - function = functionsForDataType[functionIdx] - scheduleName = function[0] - problemType = function[1] - if len(list(functionsForDataType))> 1: - if functionIdx == 0: - h += " if (functionIdxForDataType == %u) {\n" % functionIdx - elif functionIdx == len(list(functionsForDataType))-1: - h += " } else {\n" - else: - h += " } else if (functionIdxForDataType == %u) {\n" \ - % functionIdx - - # strides - indexChars = globalParameters["IndexChars"] - firstStride = 1 - assert(not 
problemType["UseInitialStridesCD"]) # not supported in old client - if problemType["UseInitialStridesAB"]: - firstStride = 0 - lastStrideD = problemType["NumIndicesC"] - lastStrideC = problemType["NumIndicesC"] - lastStrideA = len(problemType["IndexAssignmentsA"]) - lastStrideB = len(problemType["IndexAssignmentsB"]) - - # calculate strides - for i in range(0,lastStrideD): - h += " unsigned int strideD%u%s = 1" % (i, indexChars[i]) - for j in range(0, i): - h += "*sizes[%i]" % j - h += ";\n" - h += " if (strideD != std::numeric_limits::max()) strideD%u%s = strideD;\n" % (lastStrideD-1, indexChars[lastStrideD-1]) - for i in range(0,lastStrideC): - h += " unsigned int strideC%u%s = 1" % (i, indexChars[i]) - for j in range(0, i): - h += "*sizes[%i]" % j - h += ";\n" - h += " if (strideC != std::numeric_limits::max()) strideC%u%s = strideC;\n" % (lastStrideC-1, indexChars[lastStrideC-1]) - - for i in range(0,lastStrideA): - h += " unsigned int strideA%u%s = 1" % (i, \ - indexChars[problemType["IndexAssignmentsA"][i]]) - for j in range(0, i): - h += "*sizes[%i]" % \ - problemType["IndexAssignmentsA"][j] - h += ";\n" - h += " if (strideA != std::numeric_limits::max()) strideA%u%s = strideA;\n" % (lastStrideA-1, indexChars[problemType["IndexAssignmentsA"][lastStrideA-1]]) - for i in range(0,lastStrideB): - h += " unsigned int strideB%u%s = 1" % (i, \ - indexChars[problemType["IndexAssignmentsB"][i]]) - for j in range(0, i): - h += "*sizes[%i]" % \ - problemType["IndexAssignmentsB"][j] - h += ";\n" - h += " if (strideB != std::numeric_limits::max()) strideB%u%s = strideB;\n" % (lastStrideB-1, indexChars[problemType["IndexAssignmentsB"][lastStrideB-1]]) - for i in range(0, problemType["TotalIndices"]): - h += " unsigned int size%s = sizes[%u];\n" % (indexChars[i], i) - - # function call - h += " // call solution function\n" - h += " return %s_%s(\n" % (functionName, problemType) - if enqueue: - if globalParameters["RuntimeLanguage"] == "OCL": - h += " 
static_cast(deviceD),\n" - h += " static_cast(deviceC),\n" - h += " static_cast(deviceA),\n" - h += " static_cast(deviceB),\n" - else: - h += " static_cast<%s *>(deviceD),\n" % destTypeName - h += " static_cast<%s *>(deviceC),\n" % destTypeName - h += " static_cast<%s *>(deviceA),\n" % typeName - h += " static_cast<%s *>(deviceB),\n" % typeName - h += " alpha,\n" - if problemType["UseBeta"]: - h += " beta,\n" - for i in range(firstStride,lastStrideD): - h += " strideD%u%s,\n" % (i, indexChars[i]) - for i in range(firstStride,lastStrideC): - h += " strideC%u%s,\n" % (i, indexChars[i]) - for i in range(firstStride,lastStrideA): - h += " strideA%u%s,\n" % (i, \ - indexChars[problemType["IndexAssignmentsA"][i]]) - for i in range(firstStride,lastStrideB): - h += " strideB%u%s,\n" % (i, \ - indexChars[problemType["IndexAssignmentsB"][i]]) - for i in range(0, problemType["TotalIndices"]): - h += " size%s%s\n" % (indexChars[i], "," if i != problemType["TotalIndices"]-1 else "") - if enqueue: - if globalParameters["RuntimeLanguage"] == "OCL": - h += ", stream, numEvents, event_wait_list, outputEvent" - else: - h += ", stream, numEvents, startEvent, stopEvent, static_cast(deviceWS)" - h += ");\n" - - if len(functionsForDataType) > 1: - h += " }\n" # close last if - h += "};\n" # close callToFunction - - ############################################################################## - # Results File Name - ############################################################################## - if forBenchmark: - h += "/* results file name */\n" - resultsFileName = os.path.join(stepBaseDir, \ - "../Data","%s.csv" % stepName) - resultsFileName = resultsFileName.replace("\\", "\\\\") - h += "const char *resultsFileName = \"%s\";\n" % resultsFileName - - granularityFileName = os.path.join(stepBaseDir, \ - "../Data","%s_Granularity.csv" % stepName) - - granularityFileName = granularityFileName.replace("\\", "\\\\") - h += "const char *granularityFileName = \"%s\";\n" % granularityFileName 
- - ############################################################################## - # Write File - ############################################################################## - clientParametersFile = open(os.path.join(globalParameters["WorkingPath"], \ - "ClientParameters.h"), "w") - clientParametersFile.write(CHeader) - clientParametersFile.write(h) - clientParametersFile.close() diff --git a/Tensile/Code.py b/Tensile/Code.py index 9836af685..61cc9553f 100644 --- a/Tensile/Code.py +++ b/Tensile/Code.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2016-2022 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2016-2023 Advanced Micro Devices, Inc. All rights reserved. # # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -28,18 +28,6 @@ # Global to print module names around strings printModuleNames = 0 -def printItemList(listOfItems, tag="__unnamed__"): - header = "="*40 - print("%s\nbegin list %s\n%s"%(header, tag, header)) - for i, item in enumerate(listOfItems): - item = list(item) if isinstance(item, tuple) else [item] - print("list[%s] %s"%(i, "-"*30)) - for j, t in enumerate(item): - ostream = t.prettyPrint() - ostream = ostream[:-1] if len(ostream)>0 and ostream[-1:] == '\n' else ostream - print(ostream) - print("%s\nend list %s\n%s"%(header, tag, header)) - class Item: """ Base class for Modules, Instructions, etc @@ -170,16 +158,6 @@ def prettyPrint(self,indent=""): | | |--GlobalReadInst bogusGlobalReadInst // comments """ - def countTypeList(self, ttypeList): - count = 0 - # add "Module" type to type list filter, where we want to count recursively - # the types under "Module" - if Module not in ttypeList: - ttypeList.append(Module) - for ttype in ttypeList: - count += self.countType(ttype) - return count - def countType(self,ttype): """ Count number of items 
with specified type in this Module diff --git a/Tensile/Source/TensileTypes.h b/Tensile/Source/TensileTypes.h index a1d8c29db..1550e5dfc 100644 --- a/Tensile/Source/TensileTypes.h +++ b/Tensile/Source/TensileTypes.h @@ -560,9 +560,7 @@ class ProblemType struct ProblemProperties { - // Constructor used in solution tables- - // See writeSolutionAndExactTable in TensileCreateLibrary - this constructor - // must be in-sync with the table written there. + // Constructor used in solution tables ProblemProperties(unsigned summationElementMultiple, unsigned free0ElementMultiple, unsigned free1ElementMultiple, diff --git a/Tensile/Tensile.py b/Tensile/Tensile.py index d8fa03218..53cf9740d 100644 --- a/Tensile/Tensile.py +++ b/Tensile/Tensile.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2016-2022 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2016-2023 Advanced Micro Devices, Inc. All rights reserved. # # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -307,35 +307,8 @@ def TensileTestPath(*args): ################################################################################ # Entry points -# the first several of these can be deprecated, only main() is used +# installed "tensile" command ################################################################################ - -# installed "tensile_rocblas_sgemm" command -def TensileROCBLASSGEMM(): - Tensile([TensileConfigPath("rocblas_sgemm.yaml"), "."]) - - -# installed "tensile_rocblas_dgemm" command -def TensileROCBLASDGEMM(): - Tensile([TensileConfigPath("rocblas_dgemm.yaml"), "."]) - - -# installed "tensile_rocblas_cgemm" command -def TensileROCBLASCGEMM(): - Tensile([TensileConfigPath("rocblas_cgemm.yaml"), "."]) - - -# installed "tensile_rocblas_zgemm" command -def TensileROCBLASZGEMM(): - 
Tensile([TensileConfigPath("rocblas_zgemm.yaml"), "."]) - - -# installed "tensile_sgemm" command -def TensileSGEMM5760(): - Tensile([TensileConfigPath("sgemm_5760.yaml"), "."]) - - -# installed "tensile" command def main(): Tensile(sys.argv[1:]) diff --git a/Tensile/TensileCreateLibrary.py b/Tensile/TensileCreateLibrary.py index 69a53cc65..f41714bcd 100644 --- a/Tensile/TensileCreateLibrary.py +++ b/Tensile/TensileCreateLibrary.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2016-2022 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2016-2023 Advanced Micro Devices, Inc. All rights reserved. # # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -622,144 +622,6 @@ def success(kernel): return codeObjectFiles -def writeSolutionAndExactTable(scheduleName, deviceNames, schedProbName, problemType, \ - solutionsForSchedule, solutionNames, exactLogic): - s = "" - s += "namespace { // Start schedule '%s'\n" % scheduleName - - s += "// solution table - function, name, assertion requirements\n" - s += "static const SolutionInfo solutionTable_%s[] = {\n" % (schedProbName) - for i in range(0, len(solutionsForSchedule)): - solution = solutionsForSchedule[i] - solutionName = solutionNames[i] - s += " {(void*)%s, \"%s\", {%d, %d, %d, %d, %d, %d, %d} }%s // %d" % \ - (solutionName, solutionName, \ - solution["AssertSummationElementMultiple"], \ - solution["AssertFree0ElementMultiple"], \ - solution["AssertFree1ElementMultiple"], \ - solution["AssertMinApproxSize"], \ - False, \ - solution["PackBatchDims"]==2, \ - solution["PackBatchDims"]==1, \ - "," if i < len(solutionsForSchedule)-1 else "", \ - i) - s += "\n" - - s += "};\n\n" - - # Write the exact problems here - s += "// table of exact problem dims and selected solutionIdx\n" - s += "static const std::pair embeddedExactTable_%s[] = 
{\n" % (problemType,schedProbName) - numSizes = problemType["TotalIndices"] - for ruleIdx in range(0, len(exactLogic)): - rule = exactLogic[ruleIdx] - problemSize = rule[0][:numSizes] - solutionIdx = rule[1][0] - solutionGFlops = rule[1][1] - s += " { {" - for i in range(0, len(problemSize)): - if i == 0: - s += "%u" % problemSize[i] - else: - s += ", %u" % problemSize[i] - s += "}, %u}" % (solutionIdx) - s += "," if ruleIdx != len(exactLogic)-1 else " " - s += " // %.0f GFlop/s" % (solutionGFlops) - s += "\n" - s += "};\n\n" - - # Create a solution mapper and init with the table above: - s += "// The solution master constructor here adds device to the master solution mapper\n" - s += "// The entrypoint to find a solution for this problem is through the master solution master\n" - s += "static SolutionMapper_%s solutionMapper_%s(\n" % (problemType, schedProbName) - s += " \"%s\", // schedule+problem name\n" % (schedProbName) - s += " solutionTable_%s, %u,\n" % (schedProbName, len(solutionsForSchedule)) - s += " embeddedExactTable_%s, %u,\n" % (schedProbName, len(exactLogic)) - s += " &problemType_%s);\n" % (problemType) - - s += "} // end anonymous namespace\n" - return s - - -################################################################################ -# Write Range Logic Recursive -# ptr : -# True : write logic to return the function pointer -# False : write logic to return the function name -################################################################################ -def writeExactLogic(problemType, indexOrder, - solutionsForSchedule, exactLogic, \ - solutionNames, ptr): - s = "" - s += " ProblemDims_%s pdims(" % problemType - indexChars = globalParameters["IndexChars"] - firstStrideAB = 0 if problemType["UseInitialStridesAB"] else 1 - firstStrideCD = 0 if problemType["UseInitialStridesCD"] else 1 - lastStrideD = problemType["NumIndicesC"] - lastStrideC = problemType["NumIndicesC"] - lastStrideA = len(problemType["IndexAssignmentsA"]) - lastStrideB = 
len(problemType["IndexAssignmentsB"]) - for i in range(firstStrideCD,lastStrideD): - if i != firstStrideCD: s += ", " - s += "strideD%u%s" % (i, indexChars[i]) - for i in range(firstStrideCD,lastStrideC): - s += ", strideC%u%s" % (i, indexChars[i]) - for i in range(firstStrideAB,lastStrideA): - s += ", strideA%u%s" % (i, \ - indexChars[problemType["IndexAssignmentsA"][i]]) - for i in range(firstStrideAB,lastStrideB): - s += ", strideB%u%s" % (i, \ - indexChars[problemType["IndexAssignmentsB"][i]]) - for i in range(0,len(indexOrder)): - s += ", size%s" % indexChars[i] - s += ");\n" - - s += " auto solutionMapper = reinterpret_cast (masterSolutionMapper_%s.mapper());\n" \ - % (problemType, problemType) - if ptr: - s += " return solutionMapper->getSolutionWithFallback(pdims,&masterSolutionMapper_%s);\n" % problemType - else: - s += " return solutionMapper->getSolutionWithFallback(pdims,&masterSolutionMapper_%s)->_info->_name;\n" % problemType - - return s - - -################################################################################ -# Write Solution Call -################################################################################ -def writeSolutionCall(solutionName, problemType): - indexChars = globalParameters["IndexChars"] - s = "" - s += "%s(" % solutionName - # solution parameters - s += " dataD, dataC, dataA, dataB, alpha" - if problemType["UseBeta"]: - s += ", beta" - s += ", offsetC, offsetA, offsetB" - firstStrideAB = firstStrideCD = 1 - if problemType["UseInitialStridesAB"]: - firstStrideAB = 0 - if problemType["UseInitialStridesCD"]: - firstStrideCD = 0 - lastStrideD = problemType["NumIndicesC"] - lastStrideC = problemType["NumIndicesC"] - lastStrideA = len(problemType["IndexAssignmentsA"]) - lastStrideB = len(problemType["IndexAssignmentsB"]) - for i in range(firstStrideCD,lastStrideD): - s += ", strideD%u%s" % (i, indexChars[i]) - for i in range(firstStrideCD,lastStrideC): - s += ", strideC%u%s" % (i, indexChars[i]) - for i in 
range(firstStrideAB,lastStrideA): - s += ", strideA%u%s" % (i, \ - indexChars[problemType["IndexAssignmentsA"][i]]) - for i in range(firstStrideAB,lastStrideB): - s += ", strideB%u%s" % (i, \ - indexChars[problemType["IndexAssignmentsB"][i]]) - for i in range(0, problemType["TotalIndices"]): - s += ", size%s" % indexChars[i] - s += ", stream, numInputEvents, inputEvents, outputEvent )" - return s - ############################################################################## # Min Naming / Solution and Kernel Writers ############################################################################## diff --git a/setup.py b/setup.py index 96d0f4b9e..5fa141521 100644 --- a/setup.py +++ b/setup.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2017-2022 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2017-2023 Advanced Micro Devices, Inc. All rights reserved. # # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -65,13 +65,6 @@ def readVersionFromInit(): "TensileCreateLibrary = Tensile.TensileCreateLibrary:TensileCreateLibrary", "TensileGetPath = Tensile:PrintTensileRoot", - # automatic benchmarking for rocblas - "tensile_rocblas_sgemm = Tensile.Tensile:TensileROCBLASSGEMM", - "tensile_rocblas_dgemm = Tensile.Tensile:TensileROCBLASDGEMM", - "tensile_rocblas_cgemm = Tensile.Tensile:TensileROCBLASCGEMM", - "tensile_rocblas_zgemm = Tensile.Tensile:TensileROCBLASZGEMM", - # automatically find fastest sgemm exhaustive search - "tensile_sgemm = Tensile.Tensile:TensileSGEMM5760", # Run tensile benchmark from cluster "TensileBenchmarkCluster = Tensile.TensileBenchmarkCluster:main", # Retune library logic file From 49e2c0edbb88d04c6a544761b003e50ee12803d4 Mon Sep 17 00:00:00 2001 From: Babak Poursartip Date: Tue, 5 Dec 2023 10:26:56 -0600 Subject: [PATCH 11/51] adding xf32 option to 
rocblas-bench input creator Co-authored-by: Babak --- .../automation/rocblas-benchInputCreator.py | 58 +++++++++++-------- 1 file changed, 33 insertions(+), 25 deletions(-) diff --git a/tuning/automation/rocblas-benchInputCreator.py b/tuning/automation/rocblas-benchInputCreator.py index 58dbc1dd6..f1e159df5 100644 --- a/tuning/automation/rocblas-benchInputCreator.py +++ b/tuning/automation/rocblas-benchInputCreator.py @@ -23,12 +23,15 @@ ################################################################################ # Generates rocblas-bench input files from the library logic files. +# Usage: +# $ python3 rocblas-benchInputCreator.py [-v] [-i {hpl,trig,int}] <logic-dir> <output-dir> + # creates the benchmark and verification files: -# $ python3 rocblas-benchInputCreator.py -v ../libLogics/aldebaran_Cijk_Ailk_Bjlk_BBS_BH.yaml ./ BSS_NT +# $ python3 rocblas-benchInputCreator.py -v ../libLogics ./ # creates the benchmark and verification files with hpl initialization: -# $ python3 rocblas-benchInputCreator.py -v -i hpl ../libLogics/aldebaran_Cijk_Ailk_Bjlk_BBS_BH.yaml ./ BSS_NT +# $ python3 rocblas-benchInputCreator.py -v -i hpl ../libLogics ./ # creates the benchmark file: -# $ python3 rocblas-benchInputCreator.py ../libLogics/aldebaran_Cijk_Ailk_Bjlk_BBS_BH.yaml ./ BSS_NT +# $ python3 rocblas-benchInputCreator.py ../libLogics ./ import argparse import os @@ -42,13 +45,11 @@ def parseArgs(): h = {"libLogic" : "Input library logic file", "outDir" : "Output directory for rocBLAS-bench yaml files", "verify" : "Also output verify version of yaml files", - "outfile" : "the name of output file", "initial" : "Matrix initialization: hpl, trig, int. The default is trig for non Int8 datatype, and int for Int8." 
} argParser.add_argument("libLogic", metavar="logic-file", type=str, help=h["libLogic"]) argParser.add_argument("outDir", metavar="output-dir", type=str, help=h["outDir"]) - argParser.add_argument("outfile", metavar="output-file", type=str, help=h["outfile"]) argParser.add_argument("--verify", "-v", action="store_true", help=h["verify"]) argParser.add_argument("--initialization", "-i", action="store", type=str, default = 'trig', help=h["initial"]) @@ -126,6 +127,9 @@ def getProblemType(problem): else: problemDict["compute_type"] = problemDict["a_type"] + if problem["F32XdlMathOp"]==9: # XF32 + problemDict["math_mode"] = 1 + return problemDict def getSizeParams(size, transA, transB): @@ -162,7 +166,7 @@ def getSizeParams(size, transA, transB): return sizeDict -def createYaml(args, problem, sizeMappings, verify): +def createYaml(args, outputfile, problem, sizeMappings, verify): bench = [] benchStrided = [] benchGeneralBatched = [] @@ -192,9 +196,7 @@ def createYaml(args, problem, sizeMappings, verify): init = {"initialization": "rand_int"} # check if the library is General Batched based on the library name - generalBatched = False - if "_GB.yaml" in os.path.split(args.libLogic)[-1]: - generalBatched = True + generalBatched = True if "_GB.yaml" in os.path.split(args.libLogic)[-1] else False # create rocBLAS-bench call for each size in logic file for (size, _) in sizeMappings: # size[0] = M, size[1] = N, size[2] = batch_count, size[3] = K, size[4] = ldc, size[5] = ldd, size[6] = lda, size[7] = ldb @@ -226,23 +228,25 @@ def createYaml(args, problem, sizeMappings, verify): benchStrided.append(params) # output file names - prefix = args.outfile - prefix += "_verify" if verify else "" + postfix = "_verify" if verify else "_bench" - benchPath = os.path.join(args.outDir, prefix + "_bench.yaml") - benchStridedPath = os.path.join(args.outDir, prefix +"_bench-strided.yaml") - benchGeneralBatchedPath = os.path.join(args.outDir, prefix +"_bench-general-batched.yaml") + benchPath 
= os.path.join(args.outDir, outputfile + postfix + ".yaml") + benchStridedPath = os.path.join(args.outDir, outputfile + postfix +"-strided.yaml") + benchGeneralBatchedPath = os.path.join(args.outDir, outputfile + postfix+ "-general-batched.yaml") # write output if len(bench) > 0: with open(benchPath, "w") as f: yaml.safe_dump(bench, f, default_flow_style=None, sort_keys=False, width=5000) + f.write(f"# End of {benchPath} \n") if len(benchStrided) > 0: with open(benchStridedPath, "w") as f: yaml.safe_dump(benchStrided, f, default_flow_style=None, sort_keys=False, width=5000) + f.write(f"# End of {benchStridedPath} \n") if len(benchGeneralBatched) > 0: with open(benchGeneralBatchedPath, "w") as f: yaml.safe_dump(benchGeneralBatched, f, default_flow_style=None, sort_keys=False, width=5000) + f.write(f"# End of {benchGeneralBatchedPath} \n") def main(): args = parseArgs() @@ -250,20 +254,24 @@ def main(): if not (args.initialization in ['hpl', 'trig', 'int']): raise RuntimeError(f"Initialization {args.initialization} is not allowed. 
Choose from hpl, trig, or int.") - with open(args.libLogic) as f: - logicData = yaml.safe_load(f) + for libname in os.listdir(args.libLogic): + output = os.path.splitext(libname)[0] + print(f" working on {output}") + yamlName = os.path.join(args.libLogic,libname) + with open(yamlName) as f: + logicData = yaml.safe_load(f) - try: - os.makedirs(args.outDir) - except OSError: - pass + try: + os.makedirs(args.outDir) + except OSError: + pass - problem = logicData[4] - sizeMappings = logicData[7] + problem = logicData[4] + sizeMappings = logicData[7] - createYaml(args, problem, sizeMappings, False) - if args.verify: - createYaml(args, problem, sizeMappings, True) + createYaml(args, output, problem, sizeMappings, False) + if args.verify: + createYaml(args, output, problem, sizeMappings, True) if __name__ == "__main__": main() From 502f57d68b1445871c390fdf4ee4d214a3d503f0 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Thu, 7 Dec 2023 03:29:33 +0900 Subject: [PATCH 12/51] Add new parameters to specify global load width for A and B separately (#1831) - added new parameter GlobalLoadVectorWidthA, B (effective with GlobalReadVectorWidth=-1) - kept existing GlobalReadVectorWidth to minimize changes in existing test cases --- Tensile/Common.py | 21 +++++-- Tensile/KernelWriter.py | 18 +++--- Tensile/SolutionStructs.py | 120 +++++++++++++++++++------------------ 3 files changed, 86 insertions(+), 73 deletions(-) diff --git a/Tensile/Common.py b/Tensile/Common.py index 0aba6f5ac..b44a42abe 100644 --- a/Tensile/Common.py +++ b/Tensile/Common.py @@ -1138,9 +1138,9 @@ def getArchitectureName(gfxName): # The byte address of the last element in the packed array must fit in 2^32. # 0x0 = each workgroup works on a single batch dim. # 0x1 = pack Batch dimensions into wg0/A - works if all batch strides for B==0. 
- # Also must set AssertFree0ElementMultiple to >= GlobalReadVectorWidth + # Also must set AssertFree0ElementMultiple to >= GlobalLoadVectorWidthA # 0x2 = pack Batch dimensions into wg1/B - works if all batch strides for A==0 - # Also must set AssertFree1ElementMultiple to >= GlobalReadVectorWidth + # Also must set AssertFree1ElementMultiple to >= GlobalLoadVectorWidthB # 0x3 = pack batch dims into both A and B. Could support any stride for A and B. (Not supported yet) "PackBatchDims": [0,1,2], @@ -1172,14 +1172,23 @@ def getArchitectureName(gfxName): # Controls desired width (#elements) for loads from global memory -> LDS. # and eliminates the pointer unshift logic - # -1 : Set GlobalReadVectorWidth = VectorWidth + # Setting different GlobalLoadVectorWidth for A,B is now supported + # (GlobalReadVectorWidth is still valid to set the same value to both A and B) + # -1 : Set GlobalLoadVectorWidthA/B = VectorWidth # NOTE: for input bpe=32, max GRVW is 4 (to fit dwordX4) (FP32), min GRVW is 1 (dword) # bpe=16, max GRVW is 8 (to fit dwordX4) (FP16), min GRVW is 2 (dword) # bpe=8, max GRVW is 16 (to fit dwordX4) (INT8), min GRVW is 4 (dword) + # NOTE: GlobalLoadVectorWidthA/B can be auto-adjusted in SolutionStruct.py + "GlobalLoadVectorWidthA": [ -1, 1, 2, 3, 4, 6, 8, 16 ], + "GlobalLoadVectorWidthB": [ -1, 1, 2, 3, 4, 6, 8, 16 ], + + # legacy setting for global load width + # -1 : use GlobalLoadVectorWidthA, GlobalLoadVectorWidthB + # > 0 : GlobalLoadVectorWidthA=GlobalLoadVectorWidthB=GlobalReadVectorWidth "GlobalReadVectorWidth": [ -1, 1, 2, 3, 4, 6, 8, 16 ], # Controls desired width (#elements) for loads from LDS -> VGPR. - # -1 : Set LocalReadVectorWidth = VectorWidth + # -1 : Set LocalReadVectorWidth = MIInputPerThread if MatrixInstruction else VectorWidth # 1 cannot be used for half type. 
# used in combination with TransposeLDS=True # in TransposeLDS=1 case, use wider load to fetch elements in summation dimension from LDS @@ -1195,7 +1204,7 @@ def getArchitectureName(gfxName): # If the ThreadTile is > VectorWidth then thread0 will next operate on the 4 elements in C at (4*NumThreads) # Typically the load vector width and store vector width are directly related to the VW. # The global load width is closely related to the width of local stores so - # GlobalReadVectorWidth also controls local write width. + # GlobalLoadVectorWidthA/B also controls local write width. # Local read width also matches since VectorWidth consecutive elements must be read # Typically matching 16 bytes is good choice since the stores will be optimally coalesced with 16 bytes/WI. # -1 means use the largest vector width up to 128 bits. @@ -1411,6 +1420,8 @@ def getArchitectureName(gfxName): {"VectorWidth": [ -1 ] }, {"VectorStore": [ -1 ] }, {"StoreVectorWidth": [ -1 ] }, + {"GlobalLoadVectorWidthA": [ -1 ] }, + {"GlobalLoadVectorWidthB": [ -1 ] }, {"GlobalReadVectorWidth": [ -1 ] }, {"LocalReadVectorWidth": [ -1 ] }, {"GlobalReadCoalesceVectorA": [ True ] }, diff --git a/Tensile/KernelWriter.py b/Tensile/KernelWriter.py index 4bdc974e1..e51b22e63 100644 --- a/Tensile/KernelWriter.py +++ b/Tensile/KernelWriter.py @@ -3681,7 +3681,7 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): # - BufferLoad = True # - SuppressNoLoadLoop = False # - MatrixInstruction + MatrixInstK > 1 - # - global read width for TailLoop decided by assert is multiple of GlobalReadVectorWidth + # - global read width for TailLoop decided by assert is multiple of GlobalLoadVectorWidthA/B # (this is necessary to use prefetch global read fot tail loop without out of range access at the edge) # - GlobalSplitU = 1 # GSU>1 case, remaining K is distributed unevenly and does not work with tailLoop in noLoadLoop @@ -4009,25 +4009,25 @@ def isPowerOf2(val): if kernel["GlobalReadCoalesceVectorA"]: # 
read vectors, write vectors self.writeUnrollDimComponentsA = False # Scalar if kernel["LocalDotLayout"]>1: - self.writeTileDimComponentsA = kernel["GlobalReadVectorWidth"] > 1 # Components + self.writeTileDimComponentsA = kernel["GlobalLoadVectorWidthA"] > 1 # Components writeCoal = False else: self.writeTileDimComponentsA = False # Vector writeCoal = True else: # read components, write components self.writeTileDimComponentsA = False # Scalar - self.writeUnrollDimComponentsA = kernel["GlobalReadVectorWidth"] > 1 # Components + self.writeUnrollDimComponentsA = kernel["GlobalLoadVectorWidthA"] > 1 # Components writeCoal = False else: # TN yes transpose self.numWritesCoalA = kernel["NumLoadsPerpendicularA"] if kernel["GlobalReadCoalesceVectorA"]: # read vector, write components self.writeUnrollDimComponentsA = False # Scalar if kernel["LocalDotLayout"]>1: - self.writeTileDimComponentsA = kernel["GlobalReadVectorWidth"] > 1 # Components + self.writeTileDimComponentsA = kernel["GlobalLoadVectorWidthA"] > 1 # Components # LDS writes with LDL>1 will never be coalesced writeCoal = False else: - self.writeTileDimComponentsA = kernel["GlobalReadVectorWidth"] > 1 # Components + self.writeTileDimComponentsA = kernel["GlobalLoadVectorWidthA"] > 1 # Components writeCoal = False else: # read components, write vectors self.writeTileDimComponentsA = False # Vector @@ -4118,14 +4118,14 @@ def isPowerOf2(val): if kernel["GlobalReadCoalesceVectorB"]: self.writeUnrollDimComponentsB = False # Vector if kernel["LocalDotLayout"]>1: - self.writeTileDimComponentsB = kernel["GlobalReadVectorWidth"] > 1 # Components + self.writeTileDimComponentsB = kernel["GlobalLoadVectorWidthB"] > 1 # Components writeCoal = False else: self.writeTileDimComponentsB = False # Vector writeCoal = True else: self.writeTileDimComponentsB = False # Scalar - self.writeUnrollDimComponentsB = kernel["GlobalReadVectorWidth"] > 1 # Components + self.writeUnrollDimComponentsB = kernel["GlobalLoadVectorWidthB"] > 1 # 
Components # NEW self.numWritesCoalVecCompB = 1 self.numWritesPerpVecCompB = vwb @@ -4134,11 +4134,11 @@ def isPowerOf2(val): if kernel["GlobalReadCoalesceVectorB"]: self.writeUnrollDimComponentsB = False if kernel["LocalDotLayout"]>1: - self.writeTileDimComponentsB = kernel["GlobalReadVectorWidth"] > 1 # Components + self.writeTileDimComponentsB = kernel["GlobalLoadVectorWidthB"] > 1 # Components # LDS writes with LDL>1 will never be coalesced writeCoal = False else: - self.writeTileDimComponentsB = kernel["GlobalReadVectorWidth"] > 1 # Components + self.writeTileDimComponentsB = kernel["GlobalLoadVectorWidthB"] > 1 # Components writeCoal = False else: self.writeTileDimComponentsB = False # Vector diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index 0239d23ff..b1699ee2f 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -2026,8 +2026,8 @@ def setGlobalLoadVectorWidth(state, tc, totalElements, grvw): % (pv, totalElements, numThreadGrvw)) validDepthU = False if grvw < 1 or grvw % pv != 0: - reject(None, "GlobalReadVectorWidth %u %% pv %u != 0" \ - % (grvw, pv)) + reject(None, "GlobalLoadVectorWidth%s %u %% pv %u != 0" \ + % (tc, grvw, pv)) validDepthU = False grvw = grvw//pv numThreadGrvw = numThreadGrvw//pv @@ -2148,7 +2148,7 @@ def setGlobalLoadTileDimClassic(state, tc, numLoads, totalVectorsCoalesced, tota # state[NumLoadsPerpendicular*] # state[LSC*] # state[LSP*] - # state[GlobalReadVectorWidth] + # state[GlobalLoadVectorWidthA/B] # # LSC and LSP define the shape of the PerLoadTile, measured in elements. # LSC*LSP is the elements loaded by a single instruction across all @@ -2187,7 +2187,7 @@ def setGlobalLoadTileDimClassic(state, tc, numLoads, totalVectorsCoalesced, tota # The KernelWriterAssembly will modify the LWO for the last load. This allows # flexibility in the unroll factors for example. 
@staticmethod - def setGlobalLoadTileDimFractional(state, tc, depthU): + def setGlobalLoadTileDimFractional(state, tc, depthU, glvwOrig): assert(depthU > 0) dbFract = 0 @@ -2205,13 +2205,13 @@ def setGlobalLoadTileDimFractional(state, tc, depthU): % (tc, state["MacroTile0"], state["MacroTile1"], depthU, \ parDim, perpDim, \ state["WorkGroup"][0], state["WorkGroup"][1], state["LocalSplitU"], \ - state["NumThreads"], state["GlobalReadVectorWidth"])) + state["NumThreads"], glvwOrig)) # Try to find a GRVW which is smaller than the LSC and also does not force # the LSC to wrap - both of these conditions can be tested with lsc % grvw ==0. # Each iteration divides GRWV by 2 which provides finer granularity # and a possible opportunity to handle the lsc - grvw = state["GlobalReadVectorWidth"] + grvw = glvwOrig minGrvw = 2 if state["ProblemType"]["DataType"].isHalf() and \ globalParameters["ArchCaps"][globalParameters["CurrentISA"]]["HasEccHalf"] else 1 # TODO- check this for int8 and fractional load @@ -2268,15 +2268,15 @@ def setGlobalLoadTileDimFractional(state, tc, depthU): if bestVw == -1: if dbFract: - print ("reject fractional - no acceptable tile dim? GlobalReadVectorWidth", \ - state["GlobalReadVectorWidth"]) + print ("reject fractional - no acceptable tile dim? GlobalLoadVectorWidthA/B", \ + glvwOrig) return False # could not find a solution, perhaps only possible for half ? state["GlobalLoadVectorWidth%s"%tc] = bestVw - if bestVw != state["GlobalReadVectorWidth"]: + if bestVw != glvwOrig: if dbFract: print(" reducing GlobalLoadVectorWidth%s from %u to %u" \ - % (tc, state["GlobalReadVectorWidth"], bestVw)) + % (tc, glvwOrig, bestVw)) # How many loads per threads in each dimension. 
# threads which are outside the global read tile bounds will be clipped @@ -2507,9 +2507,9 @@ def isDirectToVgprDoable(state, tc): reject(state, "DirectToVgpr%c does not supports ExpandPointerSwap = False"%(tc)) return False - # Does not work with TLU + VectorWidth != GlobalReadVectorWidth (VW = 2 + GRVW = 1 or VW = 1 + GRVW = 2 does not work) + # Does not work with TLU + VectorWidth != GlobalLoadVectorWidth (VW = 2 + GRVW = 1 or VW = 1 + GRVW = 2 does not work) if state["ProblemType"]["TLU%c"%tc] and state["VectorWidth"] != state["GlobalLoadVectorWidth%c"%tc]: - reject(state, "DirectToVgpr%c does not supports TLU + VectorWidth(=%u) != GlobalReadVectorWidth%c(%u)"%(tc, state["VectorWidth"], tc, state["GlobalLoadVectorWidth%c"%tc])) + reject(state, "DirectToVgpr%c does not supports TLU + VectorWidth(=%u) != GlobalLoadVectorWidth%c(%u)"%(tc, state["VectorWidth"], tc, state["GlobalLoadVectorWidth%c"%tc])) return False # Does not work with FractionalLoad and (not TLU) @@ -2520,7 +2520,7 @@ def isDirectToVgprDoable(state, tc): # Does not work with TLU=False and NumLoadsCoalesced != DepthU//(MatrixInstK*GRVW*LSU//MIInputPerThread) if (not state["ProblemType"]["TLU%c"%tc]) and \ state["NumLoadsCoalesced%c"%tc] != state["DepthU"] // (state["MatrixInstK"] * state["GlobalLoadVectorWidth%c"%tc] * state["LocalSplitU"] // state["MIInputPerThread"]): - reject(state, "DirectToVgpr%c does not supports TLU=False and NumLoadsCoalesced%c != DepthU//(MatrixInstK*GlobalReadVectorWidth*LocalSplitU//MIInputPerThread(=%u))"%(tc, tc, state["MIInputPerThread"])) + reject(state, "DirectToVgpr%c does not supports TLU=False and NumLoadsCoalesced%c != DepthU//(MatrixInstK*GlobalLoadVectorWidth*LocalSplitU//MIInputPerThread(=%u))"%(tc, tc, state["MIInputPerThread"])) return False # TLU=False case, need GlobalLoadVectorWidth == LocalReadVectorWidth @@ -3285,9 +3285,19 @@ def assignDerivedParameters(state): #if state["KernelLanguage"] == "Assembly" and state["PackSummationDims"]: # reject(state, 
"PackSummationDims does not yet support assembly") - # Default GlobalReadVectorWidth - if state["GlobalReadVectorWidth"] == -1: - state["GlobalReadVectorWidth"] = state["VectorWidth"] + # Use GlobalReadVectorWidth if it is not -1 + if state["GlobalReadVectorWidth"] != -1: + state["GlobalLoadVectorWidthA"] = state["GlobalReadVectorWidth"] + state["GlobalLoadVectorWidthB"] = state["GlobalReadVectorWidth"] + + # Default GlobalLoadVectorWidthA, B + for tc in ('A','B'): + if state["GlobalLoadVectorWidth%s"%tc] == -1: + state["GlobalLoadVectorWidth%s"%tc] = state["VectorWidth"] + # reject - GLVWA/B too big + if (state["GlobalLoadVectorWidth%s"%tc] * state["ProblemType"]["DataType"].numBytes()) > 16: + reject(state, "GlobalLoadVectorWidth%s * DataType.numBytes() > 16"%tc) + return # Default GlobalStoreVectorWidth if state["StoreVectorWidth"] == -1: @@ -3316,11 +3326,6 @@ def assignDerivedParameters(state): reject(state, "VW * DataType.numBytes() > 16") return - # reject - GRVW too big - if (state["GlobalReadVectorWidth"] * state["ProblemType"]["DataType"].numBytes()) > 16: - reject(state, "GRVW * DataType.numBytes() > 16") - return - # LocalSplitU too large? numElementsPerWorkGroup = state["MacroTile0"]*state["MacroTile1"] @@ -3491,11 +3496,13 @@ def assignDerivedParameters(state): ######################################## # Search DepthU # Inputs: - # - depthU, userDepthU, state["LocalSplitU"], state["InnerUnroll"], state["MacroTile0/1"], state["GlobalReadVectorWidth"] + # - depthU, userDepthU, state["LocalSplitU"], state["InnerUnroll"], state["MacroTile0/1"], state["GlobalLoadVectorWidthA/B"] # - state["MatrixInstK"], ... 
# Outputs: # - totalVectorsCoalescedA, totalVectorsCoalescedB, totalElementsPerpA, totalElementsPerpB, state["DepthU"] ####################################### + GlobalLoadVectorWidthAorig = state["GlobalLoadVectorWidthA"] # keep original value + GlobalLoadVectorWidthBorig = state["GlobalLoadVectorWidthB"] # keep original value while True: # exit criteria at end validDepthU = True # peek LoopIters @@ -3536,38 +3543,38 @@ def assignDerivedParameters(state): totalElementsB = totalElementsCoalescedB * totalElementsPerpB if state["FractionalLoad"]: - if not Solution.setGlobalLoadTileDimFractional(state, "A", depthU): + if not Solution.setGlobalLoadTileDimFractional(state, "A", depthU, GlobalLoadVectorWidthAorig): validDepthU = False - if not Solution.setGlobalLoadTileDimFractional(state, "B", depthU): + if not Solution.setGlobalLoadTileDimFractional(state, "B", depthU, GlobalLoadVectorWidthBorig): validDepthU = False else: - GlobalReadVectorWidth = state["GlobalReadVectorWidth"] + GlobalLoadVectorWidthA = GlobalLoadVectorWidthAorig if state["DirectToVgprA"]: if not state["SourceSwap"]: - GlobalReadVectorWidth = 1 # adjust GlobalReadVectorWidth to 1 in DirectToVgpr case (except for DirectToVgprA + SourceSwap) - elif state["DirectToLdsA"] and (bpeAB * GlobalReadVectorWidth) > 4: + GlobalLoadVectorWidthA = 1 # adjust GlobalLoadVectorWidth to 1 in DirectToVgpr case (except for DirectToVgprA + SourceSwap) + elif state["DirectToLdsA"] and (bpeAB * GlobalLoadVectorWidthA) > 4: # bpe * grvw must be <= 4 for DirectToLds (lds flag only for <= 32bit load) - GlobalReadVectorWidth = 4 / bpeAB + GlobalLoadVectorWidthA = 4 / bpeAB # use float only for <1. 
Otherwise, convert to int - if GlobalReadVectorWidth >= 1: - GlobalReadVectorWidth = int(GlobalReadVectorWidth) - if not Solution.setGlobalLoadVectorWidth(state, "A", totalElementsA, GlobalReadVectorWidth): + if GlobalLoadVectorWidthA >= 1: + GlobalLoadVectorWidthA = int(GlobalLoadVectorWidthA) + if not Solution.setGlobalLoadVectorWidth(state, "A", totalElementsA, GlobalLoadVectorWidthA): validDepthU = False - GlobalReadVectorWidth = state["GlobalReadVectorWidth"] - if (not state["DirectToVgprB"]) and state["DirectToLdsB"] and (bpeAB * GlobalReadVectorWidth) > 4: + GlobalLoadVectorWidthB = GlobalLoadVectorWidthBorig + if (not state["DirectToVgprB"]) and state["DirectToLdsB"] and (bpeAB * GlobalLoadVectorWidthB) > 4: # bpe * grvw must be <= 4 for DirectToLds - GlobalReadVectorWidth = 4 / bpeAB + GlobalLoadVectorWidthB = 4 / bpeAB # use float only for <1. Otherwise, convert to int - if GlobalReadVectorWidth >= 1: - GlobalReadVectorWidth = int(GlobalReadVectorWidth) - if not Solution.setGlobalLoadVectorWidth(state, "B", totalElementsB, GlobalReadVectorWidth): + if GlobalLoadVectorWidthB >= 1: + GlobalLoadVectorWidthB = int(GlobalLoadVectorWidthB) + if not Solution.setGlobalLoadVectorWidth(state, "B", totalElementsB, GlobalLoadVectorWidthB): validDepthU = False if validDepthU and state["KernelLanguage"] == "Assembly" \ and (state["ProblemType"]["DataType"].isHalf() \ or state["ProblemType"]["DataType"].isBFloat16()): if globalParameters["ArchCaps"][globalParameters["CurrentISA"]]["HasEccHalf"]: - if state["GlobalLoadVectorWidthA"] == 1 or state["GlobalLoadVectorWidthB"] == 1: + if state["GlobalLoadVectorWidthA"] <= 1 or state["GlobalLoadVectorWidthB"] <= 1: reject(state, "HalfEcc requires GLVWA > 1") # TODO- Need this restrict ? 
@@ -3579,17 +3586,13 @@ def assignDerivedParameters(state): reject(state, "Int8 requires GLVWB >= 4, current is %u"%state["GlobalLoadVectorWidthB"]) - # Now convert elements to vectors based on GlobalReadVectorWidth - GlobalLoadVectorWidthA = state["GlobalLoadVectorWidthA"] - GlobalLoadVectorWidthB = state["GlobalLoadVectorWidthB"] - if GlobalLoadVectorWidthA == 0: - GlobalLoadVectorWidthA = GlobalReadVectorWidth - if GlobalLoadVectorWidthB == 0: - GlobalLoadVectorWidthB = GlobalReadVectorWidth - totalVectorsCoalescedA = totalElementsCoalescedA // GlobalLoadVectorWidthA - totalVectorsCoalescedB = totalElementsCoalescedB // GlobalLoadVectorWidthB - totalVectorsA = totalElementsA // GlobalLoadVectorWidthA - totalVectorsB = totalElementsB // GlobalLoadVectorWidthB + # Now convert elements to vectors based on GlobalLoadVectorWidth + GlobalLoadVectorWidthA = GlobalLoadVectorWidthAorig if state["GlobalLoadVectorWidthA"] == 0 else state["GlobalLoadVectorWidthA"] + GlobalLoadVectorWidthB = GlobalLoadVectorWidthBorig if state["GlobalLoadVectorWidthB"] == 0 else state["GlobalLoadVectorWidthB"] + totalVectorsCoalescedA = int(totalElementsCoalescedA / GlobalLoadVectorWidthA) + totalVectorsCoalescedB = int(totalElementsCoalescedB / GlobalLoadVectorWidthB) + totalVectorsA = int(totalElementsA / GlobalLoadVectorWidthA) + totalVectorsB = int(totalElementsB / GlobalLoadVectorWidthB) if 0: print("info:", pvar(state, "NumThreads"), pvar(state, "DepthU"), pvar(state, "DepthULdsDivisor"), @@ -3614,14 +3617,12 @@ def assignDerivedParameters(state): or state["GlobalLoadVectorWidthB"] != 1: validDepthU = False elif userDepthU == -2: - if max( state["GlobalLoadVectorWidthA"], \ - state["GlobalLoadVectorWidthB"]) \ - < state["GlobalReadVectorWidth"]: + if state["GlobalLoadVectorWidthA"] < GlobalLoadVectorWidthAorig and \ + state["GlobalLoadVectorWidthB"] < GlobalLoadVectorWidthBorig: validDepthU = False elif userDepthU <= -3: - if min( state["GlobalLoadVectorWidthA"], \ - 
state["GlobalLoadVectorWidthB"]) \ - < state["GlobalReadVectorWidth"]: + if state["GlobalLoadVectorWidthA"] < GlobalLoadVectorWidthAorig or \ + state["GlobalLoadVectorWidthB"] < GlobalLoadVectorWidthBorig: validDepthU = False if validDepthU: @@ -3906,7 +3907,7 @@ def assignDerivedParameters(state): rejectMessage += "\n" + "To enable NoTailLoop, " rejectMessage += "\n" + " - AssertSummationElementMultiple/GlobalSplitU) is multiple of DepthU or" rejectMessage += "\n" + " - BufferLoad and MatrixInstruction + MatrixInstK > 1 and" - rejectMessage += "\n" + " (global read width for TailLoop decided by assert is multiple of GlobalReadVectorWidth) and" + rejectMessage += "\n" + " (global read width for TailLoop decided by assert is multiple of GlobalLoadVectorWidth) and" rejectMessage += "\n" + " (StaggerU = 0 or NT(+BufferLoad))" reject(state, rejectMessage) return @@ -4384,9 +4385,10 @@ def assignDerivedParameters(state): reject(state, "DepthULdsDivisor > 1: Only works with TN problem layout and UnrollMajorLDS") if state["PrefetchGlobalRead"]==1 and state["PrefetchLocalRead"]==0: reject(state, "PGR1 + PLR0 in SplitLDS requires double G2L buffer which is yet to be implemented") - if state["ProblemType"]["DataType"].numRegisters()*state["GlobalReadVectorWidth"] < state["DepthULdsDivisor"]: - reject(state, "SplitLDS requires wider GlobalReadVectorWidth; needs RegisterPerElem (%f) * GRVW (%u) >= DepthULdsDivisor (%u)"% - (state["ProblemType"]["DataType"].numRegisters(),state["GlobalReadVectorWidth"],state["DepthULdsDivisor"])) + for tc in ('A', 'B'): + if state["ProblemType"]["DataType"].numRegisters()*state["GlobalLoadVectorWidth%s"%tc] < state["DepthULdsDivisor"]: + reject(state, "SplitLDS requires wider GlobalLoadVectorWidth%s; needs RegisterPerElem (%f) * GLVW%s (%u) >= DepthULdsDivisor (%u)"% + (tc, state["ProblemType"]["DataType"].numRegisters(),tc,state["GlobalLoadVectorWidth%s"%tc],state["DepthULdsDivisor"])) if state["GlobalReadPerMfma"] > 1 and 
state["PrefetchGlobalRead"] == 2: reject(state, "GlobalReadPerMfma need to be 1 if PGR2") From d76408a4a939ebc8187145162247b333e9ee47a9 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Thu, 7 Dec 2023 03:52:31 +0900 Subject: [PATCH 13/51] Re-enable negative values for WorkGroupMapping (asm kernel only) (#1838) --- Tensile/Common.py | 6 +- Tensile/KernelWriterAssembly.py | 59 ++++++++++--------- Tensile/SolutionStructs.py | 8 ++- .../Source/lib/source/ContractionSolution.cpp | 14 ++++- Tensile/Tests/pre_checkin/mfma/sgemm_asm.yaml | 4 +- 5 files changed, 55 insertions(+), 36 deletions(-) diff --git a/Tensile/Common.py b/Tensile/Common.py index b44a42abe..26e0795d6 100644 --- a/Tensile/Common.py +++ b/Tensile/Common.py @@ -911,7 +911,9 @@ def getArchitectureName(gfxName): # For Block Mapping type: # 0 : Use hardware-assigned wg number with no remapping. # N : WG block width. "Wrap" to a new wg1 "row" assignment after N WGs assigned in that row. - # < 0 : Swaps the position of wg0 and wg1. Does not change NumWorkGroups* or ProblemNumWorkGroups*. No longer supported. + # < 0 : Swaps the position of wg0 and wg1. Does not change NumWorkGroups* or ProblemNumWorkGroups*. + # Can be effective in M>N case. + # -1 is same as 1 # Tensor C always mapped with first free coord as fastest moving # (Elements in this dimension are sequential in memory. 
# @@ -933,7 +935,7 @@ def getArchitectureName(gfxName): # # Formula for wgSerial: # wgSerial = wg0 + (wg1 % WorkGroupMapping) * nwg0 - "WorkGroupMapping": list(range(0,1024+1)), # change a workgroup's id so that the all the workgroups on the gpu at a time are hitting L2 cache the best + "WorkGroupMapping": list(range(-1024,1024+1)), # change a workgroup's id so that the all the workgroups on the gpu at a time are hitting L2 cache the best "WorkGroupMappingType": ["B", "Z"], # Blocking, Z-order (not any faster than blocking, especially for the arithmetic it requires) "MaxOccupancy": list(range(1, 40+1)), # wg / CU; if cache thrashing is hurting performance, this allocates extra lds to artificially limit occupancy "WorkGroup": validWorkGroups, # ( wg0 x wg1 x LocalSplitU ) dimensions of the workgroup which will operate on a tile and share lds diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index 0dcd67d3d..cab8ddb7b 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -1738,12 +1738,14 @@ def initKernel(self, kernel, tPA, tPB ): self.defineSgpr("KernArgAddress", self.rpga) assert(self.sgprs["KernArgAddress"] == 0) # kernarg is passed to kernel as SGPR0 - if kernel["WorkGroupMapping"]>=0 : - self.defineSgpr("WorkGroup0", 1) - self.defineSgpr("WorkGroup1", 1) - else: - self.defineSgpr("WorkGroup1", 1) - self.defineSgpr("WorkGroup0", 1) + #if kernel["WorkGroupMapping"]>=0 : + # self.defineSgpr("WorkGroup0", 1) + # self.defineSgpr("WorkGroup1", 1) + #else: + # self.defineSgpr("WorkGroup1", 1) + # self.defineSgpr("WorkGroup0", 1) + self.defineSgpr("WorkGroup0", 1) + self.defineSgpr("WorkGroup1", 1) wg=2 @@ -3932,7 +3934,7 @@ def graWorkGroup(self, kernel, isPap): ######################################## # Blocked rows or columns absWgm = abs(kernel["WorkGroupMapping"]) - if kernel["WorkGroupMappingType"] == "B" and abs(kernel["WorkGroupMapping"]) > 1: + if kernel["WorkGroupMappingType"] == "B" and 
kernel["WorkGroupMapping"] > 1: smallNumMagicShift = 31 magicNumberWgm = ((1<=0 : + firstNum = "0" + secondNum = "1" + else: + firstNum = "1" + secondNum = "0" + firstWg = "WorkGroup%s"%firstNum + secondWg = "WorkGroup%s"%secondNum + # note this overwrites blockId2+1 - kStr += self.sMagicDiv(kernel, dest=blockId2, dividend=sgpr("WorkGroup1"), \ + kStr += self.sMagicDiv(kernel, dest=blockId2, dividend=sgpr(secondWg), \ magicNumber=sgpr(wgmDivisorMagicNumber), magicShift=smallNumMagicShift) kStr += inst("s_mul_i32", sgpr(wgSerial2), sgpr(blockId2), absWgm, "quotient * non-magic divisor") - kStr += inst("s_sub_u32", sgpr(wgSerial2), sgpr("WorkGroup1"), sgpr(wgSerial2), "WorkGroup1=remainder") - kStr += inst("s_mul_i32", sgpr(wgSerial2), sgpr(wgSerial2), sgpr("NumWorkGroups0"), "(wg1 % WGM)*nwg0") - kStr += inst("s_add_u32", sgpr(wgSerial2), sgpr(wgSerial2), sgpr("WorkGroup0"), "wgSerial = wg0 + (wg1 % WGM)*nwg0") + kStr += inst("s_sub_u32", sgpr(wgSerial2), sgpr(secondWg), sgpr(wgSerial2), "%s=remainder"%secondWg) + kStr += inst("s_mul_i32", sgpr(wgSerial2), sgpr(wgSerial2), sgpr("NumWorkGroups%s"%firstNum), "(wg%s %% WGM)*nwg%s"%(secondNum, firstNum)) + kStr += inst("s_add_u32", sgpr(wgSerial2), sgpr(wgSerial2), sgpr(firstWg), "wgSerial = wg%s + (wg1 %% WGM)*nwg%s"%(firstNum, secondNum)) kStr += inst("s_cmp_ge_u32", sgpr(blockId2), sgpr("NumFullBlocks"), "blockId >= numFullBlocks ?") # reuse wgmDivisorMagicNumber - may override with remainder here: kStr += inst("s_cmov_b32", sgpr(wgmDivisorMagicNumber), sgpr("MagicNumberWgmRemainder1"), "") kStr += inst("s_cselect_b32", sgpr(wgmDivisor), sgpr("WgmRemainder1"), absWgm, "") - if kernel["WorkGroupMapping"]>=0 : - firstWg = "WorkGroup0" - secondWg = "WorkGroup1" - else: - firstWg = "WorkGroup1" - secondWg = "WorkGroup0" - - assert(self.sgprs[firstWg] & 0x1 == 0) # must be even and ... 
- assert(self.sgprs[firstWg]+1 == self.sgprs[secondWg] ) # must be consecutive (for magic div below) - kStr += self.sMagicDiv(kernel, dest=self.sgprs[firstWg], dividend=sgpr(wgSerial2), \ + #assert(self.sgprs[firstWg] & 0x1 == 0) # must be even and ... + #assert(self.sgprs[firstWg]+1 == self.sgprs[secondWg] ) # must be consecutive (for magic div below) + kStr += self.sMagicDiv(kernel, dest=self.sgprs["WorkGroup0"], dividend=sgpr(wgSerial2), \ magicNumber=sgpr(wgmDivisorMagicNumber), magicShift=smallNumMagicShift) if kernel["WorkGroupMapping"]<0 : - kStr += inst("s_mov_b32", sgpr("WorkGroup0"), sgpr(firstWg), "") - kStr += inst("s_mul_i32", sgpr("WorkGroup1"), sgpr("WorkGroup0"), sgpr(wgmDivisor), "quotient * non-magic divisor") - kStr += inst("s_sub_u32", sgpr("WorkGroup1"), sgpr(wgSerial2), sgpr("WorkGroup1"), "WorkGroup1=remainder") + kStr += inst("s_mov_b32", sgpr(firstWg), sgpr("WorkGroup0"), "mov for WGM<0") + kStr += inst("s_mul_i32", sgpr(secondWg), sgpr(firstWg), sgpr(wgmDivisor), "quotient * non-magic divisor") + kStr += inst("s_sub_u32", sgpr(secondWg), sgpr(wgSerial2), sgpr(secondWg), "%s=remainder"%secondWg) - kStr += inst("s_mul_i32", sgpr(blockId2), sgpr(blockId2), \ - abs(kernel["WorkGroupMapping"]), "blockId * WGM") + kStr += inst("s_mul_i32", sgpr(blockId2), sgpr(blockId2), absWgm, "blockId * WGM") kStr += inst("s_add_u32", sgpr(secondWg), sgpr(secondWg), \ - sgpr(blockId2), "wg1 += blockId * WGM") - + sgpr(blockId2), "wg%s += blockId * WGM"%secondNum) + self.sgprPool.checkIn(tmpSgpr) return kStr diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index b1699ee2f..5a51e65e1 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -3077,7 +3077,13 @@ def assignDerivedParameters(state): state["LocalWriteUseSgprA"] = False state["LocalWriteUseSgprB"] = False - state["WorkGroupMapping" ] = abs(state["WorkGroupMapping"]) + if state["KernelLanguage"] != "Assembly" or state["WorkGroupMappingType"] == "Z": + # WGM < 0 is 
only for Asm + WorkGroupMappingType==B + # convert to > 0 + state["WorkGroupMapping" ] = abs(state["WorkGroupMapping"]) + if state["WorkGroupMapping" ] == -1: + # -1 code is same as 1. Convert to 1. + state["WorkGroupMapping" ] = 1 # avoid bug somehow related to GlobalSplitU + Persistent # avoid bug related to WGM<0 diff --git a/Tensile/Source/lib/source/ContractionSolution.cpp b/Tensile/Source/lib/source/ContractionSolution.cpp index 2ed74c37c..d0e513534 100644 --- a/Tensile/Source/lib/source/ContractionSolution.cpp +++ b/Tensile/Source/lib/source/ContractionSolution.cpp @@ -260,7 +260,7 @@ namespace Tensile TypedInputs const& inputs, Hardware const& hardware) const { - TENSILE_ASSERT_EXC(sizeMapping.workGroupMapping >= 0); + //TENSILE_ASSERT_EXC(sizeMapping.workGroupMapping >= 0); TensorDescriptor const& a = problem.a(); TensorDescriptor const& b = problem.b(); @@ -660,8 +660,16 @@ namespace Tensile if(sizeMapping.workGroupMapping != 0) { - numFullBlocks = problemNumGroupTiles1 / sizeMapping.workGroupMapping; - wgmRemainder1 = problemNumGroupTiles1 % sizeMapping.workGroupMapping; + if(sizeMapping.workGroupMapping >= 0) + { + numFullBlocks = problemNumGroupTiles1 / sizeMapping.workGroupMapping; + wgmRemainder1 = problemNumGroupTiles1 % sizeMapping.workGroupMapping; + } + else + { + numFullBlocks = problemNumGroupTiles0 / (-sizeMapping.workGroupMapping); + wgmRemainder1 = problemNumGroupTiles0 % (-sizeMapping.workGroupMapping); + } if(wgmRemainder1 == 0) wgmRemainder1 = sizeMapping.workGroupMapping; magicNumberWgmRemainder1 = smallMagicNumber(wgmRemainder1); diff --git a/Tensile/Tests/pre_checkin/mfma/sgemm_asm.yaml b/Tensile/Tests/pre_checkin/mfma/sgemm_asm.yaml index d982fb22d..4fd7ad63f 100644 --- a/Tensile/Tests/pre_checkin/mfma/sgemm_asm.yaml +++ b/Tensile/Tests/pre_checkin/mfma/sgemm_asm.yaml @@ -639,7 +639,7 @@ BenchmarkProblems: - [ 16, 16, 1 ] - [ 32, 8, 1 ] - [ 64, 4, 1 ] - - WorkGroupMapping: [8] + - WorkGroupMapping: [-8] # for negative WGM test - 
GlobalSplitU: [1] - DepthU: [ 8 ] - VectorWidth: [1] @@ -669,7 +669,7 @@ BenchmarkProblems: - [ 8, 32, 1 ] - [ 16, 16, 1 ] - [ 32, 8, 1 ] - - WorkGroupMapping: [8] + - WorkGroupMapping: [-4] # for negative WGM test - GlobalSplitU: [1] - DepthU: [ 16 ] - VectorWidth: [1] From 461dad8a32981689cf96f4d2a330d1bf6fb7e688 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Thu, 7 Dec 2023 04:13:05 +0900 Subject: [PATCH 14/51] Fix an error with DisableKernelPieces + 32bit ShadowLimit (#1839) --- Tensile/KernelWriterAssembly.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index cab8ddb7b..46b5608bf 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -5062,7 +5062,7 @@ def computeLoadSrd(self, kernel, tP, tc, indices, bpe, isPap): # invalid global read for performance evaluation only if self.enable["InvalidGlobalRead%s"%tc]: kStr += inst("s_mov_b32", sgpr("Srd%s+2"%tc), hex(0), "set out-of-bound addr for performance evaluation only") - if noShadowLimitCodeInLoop == False: + if noShadowLimitCodeInLoop == False and self.use64bShadowLimit: kStr += inst("s_mov_b32", sgpr("ShadowLimit%s+1"%tc), hex(0xffffffff), "set out-of-bound addr for performance evaluation only") return kStr From 0d942a6a8bfa8557171716dbcc1236adc806c9c5 Mon Sep 17 00:00:00 2001 From: Torre Zuk <42548444+TorreZuk@users.noreply.github.com> Date: Wed, 6 Dec 2023 13:14:49 -0700 Subject: [PATCH 15/51] another vcpkg version package name fix (#1836) * more vcpkg package options --------- Co-authored-by: Zuk --- Tensile/Source/lib/CMakeLists.txt | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/Tensile/Source/lib/CMakeLists.txt b/Tensile/Source/lib/CMakeLists.txt index d3f4b697f..3fa647d6e 100644 --- a/Tensile/Source/lib/CMakeLists.txt +++ b/Tensile/Source/lib/CMakeLists.txt @@ -98,13 +98,15 @@ if(TENSILE_USE_LLVM OR TENSILE_USE_MSGPACK) 
endif() if(TENSILE_USE_MSGPACK) - find_package(msgpack REQUIRED NAMES msgpack msgpack-c) + find_package(msgpack REQUIRED NAMES msgpack msgpack-cxx msgpack-c) target_compile_definitions(TensileHost PUBLIC -DTENSILE_MSGPACK=1) if(TARGET msgpackc-cxx) get_target_property(msgpack_inc msgpackc-cxx INTERFACE_INCLUDE_DIRECTORIES) elseif(TARGET msgpackc) get_target_property(msgpack_inc msgpackc INTERFACE_INCLUDE_DIRECTORIES) + elseif(TARGET msgpack-cxx) + get_target_property(msgpack_inc msgpack-cxx INTERFACE_INCLUDE_DIRECTORIES) endif() if(DEFINED msgpack_inc) From 1dd1f8532ced08723794ce0baf37bbe8850ac561 Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Thu, 7 Dec 2023 10:13:37 -0700 Subject: [PATCH 16/51] Fix LLVM crash issue (#1840) --- .jenkins/common.groovy | 3 +-- .jenkins/extended.groovy | 2 +- Tensile/TensileCreateLibrary.py | 6 ++++-- Tensile/cmake/TensileConfig.cmake | 4 ++-- 4 files changed, 8 insertions(+), 7 deletions(-) diff --git a/.jenkins/common.groovy b/.jenkins/common.groovy index 8ca2bb7e6..96561b377 100644 --- a/.jenkins/common.groovy +++ b/.jenkins/common.groovy @@ -35,7 +35,6 @@ def runCompileCommand(platform, project, jobName, boolean debug=false) // avoid bug causing long build times of certain files. String buildType = 'Release' // debug ? 
'Debug' : 'RelWithDebInfo' String parallelJobs = "export HIPCC_COMPILE_FLAGS_APPEND='-O3 -Wno-format-nonliteral -parallel-jobs=4'" - String buildThreads = '16' // if hipcc is used may be multiplied by parallel-jobs // comment @@ -63,7 +62,7 @@ def runCompileCommand(platform, project, jobName, boolean debug=false) pushd build export PATH=/opt/rocm/bin:\$PATH - cmake -DCMAKE_BUILD_TYPE=${buildType} -DCMAKE_CXX_COMPILER=${compiler} -DTensile_CPU_THREADS=${buildThreads} -DTensile_ROOT=\$(pwd)/../Tensile ../HostLibraryTests + cmake -DCMAKE_BUILD_TYPE=${buildType} -DCMAKE_CXX_COMPILER=${compiler} -DTensile_ROOT=\$(pwd)/../Tensile ../HostLibraryTests NPROC_BUILD=16 if [ `nproc` -lt 16 ] then diff --git a/.jenkins/extended.groovy b/.jenkins/extended.groovy index 84a944414..44ad373be 100644 --- a/.jenkins/extended.groovy +++ b/.jenkins/extended.groovy @@ -45,7 +45,7 @@ def runCI = boolean formatCheck = false - prj.timeout.test = 720 + prj.timeout.test = 600 prj.defaults.ccache = false def commonGroovy diff --git a/Tensile/TensileCreateLibrary.py b/Tensile/TensileCreateLibrary.py index f41714bcd..dae1d0502 100644 --- a/Tensile/TensileCreateLibrary.py +++ b/Tensile/TensileCreateLibrary.py @@ -1279,8 +1279,8 @@ def splitExtraParameters(par): theMasterLibrary = list(masterLibraries.values())[0] if args.EmbedLibrary is not None: - embedFileName = os.path.join(outputPath, "library/{}.cpp".format(args.EmbedLibrary)) - with EmbeddedData.EmbeddedDataFile(embedFileName) as embedFile: + embedFileNameTemp = os.path.join(outputPath, "library/{}.temp".format(args.EmbedLibrary)) + with EmbeddedData.EmbeddedDataFile(embedFileNameTemp) as embedFile: ext = ".yaml" if globalParameters["LibraryFormat"] == "yaml" else ".dat" embedFile.embed_file(theMasterLibrary.cpp_base_class, masterFile + ext, nullTerminated=True, @@ -1289,6 +1289,8 @@ def splitExtraParameters(par): for co in Utils.tqdm(codeObjectFiles): embedFile.embed_file("SolutionAdapter", co, nullTerminated=False, 
key=args.EmbedLibraryKey) + embedFileNameCpp = os.path.join(outputPath, "library/{}.cpp".format(args.EmbedLibrary)) + os.rename(embedFileNameTemp, embedFileNameCpp) if args.BuildClient: print1("# Building Tensile Client") diff --git a/Tensile/cmake/TensileConfig.cmake b/Tensile/cmake/TensileConfig.cmake index 1c853b44a..4eb49b69a 100644 --- a/Tensile/cmake/TensileConfig.cmake +++ b/Tensile/cmake/TensileConfig.cmake @@ -286,7 +286,7 @@ function(TensileCreateLibraryFiles COMMAND ${CommandLine} ) - set("${Tensile_VAR_PREFIX}_ALL_FILES" ${Tensile_MANIFEST_CONTENTS} PARENT_SCOPE) + set("${Tensile_VAR_PREFIX}_ALL_FILES" ${Tensile_EMBED_LIBRARY_SOURCE};${Tensile_MANIFEST_CONTENTS} PARENT_SCOPE) # Create a chained library build target. # We've declared the manifest contents as output of the custom @@ -295,7 +295,7 @@ function(TensileCreateLibraryFiles # command to be invoked at build time, not cmake time. TensileCreateCopyTarget( "${Tensile_VAR_PREFIX}_LIBRARY_TARGET" - "${Tensile_MANIFEST_CONTENTS}" + "${Tensile_EMBED_LIBRARY_SOURCE};${Tensile_MANIFEST_CONTENTS}" "${Tensile_OUTPUT_PATH}/library" ) From 8f81478e661adabb84c21f613b366b3d28244551 Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Fri, 8 Dec 2023 10:25:11 -0700 Subject: [PATCH 17/51] Mode to dynamically adjust number of CUs used (#1835) --- Tensile/Common.py | 12 ++++ Tensile/Source/lib/include/Tensile/AMDGPU.hpp | 25 +++++++ .../include/Tensile/ContractionSolution.hpp | 1 + Tensile/Source/lib/source/AMDGPU.cpp | 6 ++ .../Source/lib/source/ContractionSolution.cpp | 72 +++++++++++-------- 5 files changed, 85 insertions(+), 31 deletions(-) diff --git a/Tensile/Common.py b/Tensile/Common.py index 26e0795d6..caf361fcb 100644 --- a/Tensile/Common.py +++ b/Tensile/Common.py @@ -1113,6 +1113,18 @@ def getArchitectureName(gfxName): # 1: Basic StreamK atomic (uses atomics to accumulate partial tiles) # 2: Basic StreamK non-atomic (uses workspace to store partial tiles, accumulate in deterministic fix-up step) # 3: 
Two-Tile StreamK (non-atomic, each WG completes an even number of sk iterations, followed by an even number of dp tiles) + # StreamK kernels can adjust the number of CUs being used. + # Using fewer sometimes increases overall throughput by allowing other kernels to run in parallel. + # StreamK grid is controlled by setting these enviornment variables: + # TENSILE_STREAMK_DYNAMIC_GRID enables dynamic grid mode, which automatically limits the number of CUs used for small + # problems to a subset based on the number of output tiles. + # 0 = off (default) + # 1 = on + # TENSILE_STREAMK_MAX_CUS allows the user to manually set maximum number of CUs used, which could free up some CUs for + # other operations to run in parallel with gemm. + # 0 = use all CUs (default) + # TENSILE_STREAMK_GRID_MULTIPLIER lets you set how many workgroups are created per CU being used. + # 1 = 1 WG per CU (default) "StreamK": [0, 1, 2, 3], # 0 : standard launch diff --git a/Tensile/Source/lib/include/Tensile/AMDGPU.hpp b/Tensile/Source/lib/include/Tensile/AMDGPU.hpp index 4c425e593..c845d7493 100644 --- a/Tensile/Source/lib/include/Tensile/AMDGPU.hpp +++ b/Tensile/Source/lib/include/Tensile/AMDGPU.hpp @@ -27,6 +27,7 @@ #pragma once #include +#include namespace Tensile { @@ -203,6 +204,9 @@ namespace Tensile int simdPerCu = 4; int computeUnitCount = 0; int isAPU = 0; + int skDynamicGrid = 0; + int skMaxCUs = 0; + int skGridMultiplier = 1; std::string deviceName; virtual bool runsKernelTargeting(Processor p) const; @@ -218,6 +222,27 @@ namespace Tensile virtual std::string description() const; + const int getSKDynamicGrid() const + { + static const char* envStr = std::getenv("TENSILE_STREAMK_DYNAMIC_GRID"); + static const int value = (envStr == NULL ? 0 : (std::atoi(envStr) == 0 ? 0 : 1)); + return value; + } + + const int getSKMaxCUs() const + { + static const char* envStr = std::getenv("TENSILE_STREAMK_MAX_CUS"); + static const int value = (envStr == NULL ? 
0 : std::atoi(envStr)); + return value; + } + + const int getSKGridMultiplier() const + { + static const char* envStr = std::getenv("TENSILE_STREAMK_GRID_MULTIPLIER"); + static const int value = (envStr == NULL ? 1 : std::atoi(envStr)); + return value; + } + bool operator==(AMDGPU const& rhs) const { return processor == rhs.processor && computeUnitCount == rhs.computeUnitCount; diff --git a/Tensile/Source/lib/include/Tensile/ContractionSolution.hpp b/Tensile/Source/lib/include/Tensile/ContractionSolution.hpp index c04a8a27a..7cda789ac 100644 --- a/Tensile/Source/lib/include/Tensile/ContractionSolution.hpp +++ b/Tensile/Source/lib/include/Tensile/ContractionSolution.hpp @@ -202,6 +202,7 @@ namespace Tensile * Calculate required workspace size. */ size_t requiredWorkspaceSize(Problem const& problem, Hardware const& hardware) const; + size_t getSKGrid(Hardware const& hardware, size_t tiles) const; size_t partialTileSize(size_t skGrid) const; static float computeGranularity(float x); diff --git a/Tensile/Source/lib/source/AMDGPU.cpp b/Tensile/Source/lib/source/AMDGPU.cpp index ba50c9a4f..3f4eaa9fa 100644 --- a/Tensile/Source/lib/source/AMDGPU.cpp +++ b/Tensile/Source/lib/source/AMDGPU.cpp @@ -40,6 +40,9 @@ namespace Tensile , computeUnitCount(cus) , isAPU(apu) , deviceName(name) + , skDynamicGrid(getSKDynamicGrid()) + , skMaxCUs(getSKMaxCUs()) + , skGridMultiplier(getSKGridMultiplier()) { } @@ -49,6 +52,9 @@ namespace Tensile , computeUnitCount(cus) , isAPU(apu) , deviceName(name) + , skDynamicGrid(getSKDynamicGrid()) + , skMaxCUs(getSKMaxCUs()) + , skGridMultiplier(getSKGridMultiplier()) { } diff --git a/Tensile/Source/lib/source/ContractionSolution.cpp b/Tensile/Source/lib/source/ContractionSolution.cpp index d0e513534..161d3eca7 100644 --- a/Tensile/Source/lib/source/ContractionSolution.cpp +++ b/Tensile/Source/lib/source/ContractionSolution.cpp @@ -38,8 +38,6 @@ #include #include -#define TENSILE_STREAMK_GRID 1 - namespace Tensile { PerfModel perf; @@ -309,8 +307,6 
@@ namespace Tensile rv.numWorkGroups.x = CeilDivide(rv.numWorkGroups.x, sizeMapping.macroTile.x); rv.numWorkGroups.y = CeilDivide(rv.numWorkGroups.y, sizeMapping.macroTile.y); - auto numTiles = rv.numWorkGroups; - uint32_t problemNumGroupTiles0 = rv.numWorkGroups.x; uint32_t problemNumGroupTiles1 = rv.numWorkGroups.y; // used only when persistent kernel along batch @@ -319,21 +315,21 @@ namespace Tensile rv.numWorkGroups.y *= sizeMapping.globalSplitU; size_t cuCount = 0; + size_t skGrid = 0; + auto tiles = problem.getNumTiles(sizeMapping); if(sizeMapping.streamK != 0 || sizeMapping.persistentKernel != 0) { AMDGPU const* pAMDGPU = dynamic_cast(&hardware); assert(pAMDGPU != nullptr && pAMDGPU->computeUnitCount != 0); cuCount = pAMDGPU->computeUnitCount; - } - - size_t skGrid = 0; - if(sizeMapping.streamK != 0) - { - skGrid = cuCount * TENSILE_STREAMK_GRID; - rv.numWorkGroups.x = skGrid; - rv.numWorkGroups.y = 1; - if(sizeMapping.persistentKernelAlongBatch) - rv.numWorkGroups.z = 1; + if(sizeMapping.streamK != 0) + { + skGrid = getSKGrid(hardware, tiles); + rv.numWorkGroups.x = skGrid; + rv.numWorkGroups.y = 1; + if(sizeMapping.persistentKernelAlongBatch) + rv.numWorkGroups.z = 1; + } } if(sizeMapping.persistentKernel != 0) @@ -621,7 +617,6 @@ namespace Tensile if(sizeMapping.streamK != 0) { auto itersPerTile = problem.getItersPerTile(sizeMapping); - auto tiles = problem.getNumTiles(sizeMapping); auto totalIters = tiles * itersPerTile; uint32_t magicNumberItersPerTile; uint32_t magicShiftItersPerTile; @@ -638,15 +633,19 @@ namespace Tensile } else if(sizeMapping.streamK == 3) // Two-tile SK { - uint32_t numOutputTiles = tiles; - bool bigEnough = numOutputTiles > skGrid; + bool bigEnough = tiles > skGrid; // skTiles is number of Stream-K tiles to complete // Two-tile algorithm causes each WG to run an even number of Stream-K iterations, - // followed by an even number of data-parllel tiles - uint32_t skTiles - = bigEnough ? 
skGrid + numOutputTiles % skGrid : numOutputTiles; - // Number of data-parallel tiles on each workgroup would be: - // dpTilesPerWG = bigEnough ? (numOutputTiles - skTiles) / skGrid : 0; + // followed by an even number of data-parllel tiles. + // If total tiles is evenly divisble by grid size, + // then no Stream-K tiles are needed, all data-parallel + uint32_t skTiles = skGrid; + if(tiles % skGrid != 0) + { + // Number of data-parallel tiles on each workgroup would be: + // dpTilesPerWG = bigEnough ? (tiles - skTiles) / skGrid : 0; + skTiles = bigEnough ? skGrid + tiles % skGrid : tiles; + } uint32_t skItersPerWG = skTiles * itersPerTile / skGrid; uint32_t skExtraIters = skTiles * itersPerTile % (skGrid); @@ -726,11 +725,9 @@ namespace Tensile rv.workGroupSize.y = 1; rv.workGroupSize.z = 1; - AMDGPU const* pAMDGPU = dynamic_cast(&hardware); - assert(pAMDGPU != nullptr && pAMDGPU->computeUnitCount != 0); - size_t cuCount = pAMDGPU->computeUnitCount; - size_t skGrid = cuCount * TENSILE_STREAMK_GRID; - size_t wiZ = 1; + auto tiles = problem.getNumTiles(sizeMapping); + size_t skGrid = getSKGrid(hardware, tiles); + size_t wiZ = 1; for(size_t i = 0; i < problem.batchIndices().size(); i++) wiZ *= problem.batchSize(i); size_t flagCount = skGrid * wiZ; @@ -1515,10 +1512,8 @@ namespace Tensile if(sizeMapping.streamK >= 2) { - AMDGPU const* pAMDGPU = dynamic_cast(&hardware); - assert(pAMDGPU != nullptr && pAMDGPU->computeUnitCount != 0); - size_t cuCount = pAMDGPU->computeUnitCount; - size_t skGrid = cuCount * TENSILE_STREAMK_GRID; + auto tiles = problem.getNumTiles(sizeMapping); + size_t skGrid = getSKGrid(hardware, tiles); // Get space required for partial tiles size += partialTileSize(skGrid); // Add space for flags @@ -1532,6 +1527,21 @@ namespace Tensile return size; } + size_t ContractionSolution::getSKGrid(Hardware const& hardware, size_t tiles) const + { + AMDGPU const* pAMDGPU = dynamic_cast(&hardware); + assert(pAMDGPU != nullptr && pAMDGPU->computeUnitCount != 0); 
+ size_t cuCount = pAMDGPU->computeUnitCount; + size_t skGrid = cuCount; + if(pAMDGPU->skMaxCUs > 0) + skGrid = min(skGrid, pAMDGPU->skMaxCUs); + if(pAMDGPU->skDynamicGrid) + skGrid = min(skGrid, tiles); + if(pAMDGPU->skGridMultiplier > 1) + skGrid = skGrid * pAMDGPU->skGridMultiplier; + return skGrid; + } + size_t ContractionSolution::partialTileSize(size_t skGrid) const { size_t size = 0; From 213af91cee547c1267c1b12091d1fbf9174bc0b8 Mon Sep 17 00:00:00 2001 From: Babak Poursartip Date: Fri, 8 Dec 2023 17:57:42 -0600 Subject: [PATCH 18/51] update efficiency script for new architecture and xf32 datatype Co-authored-by: Babak --- tuning/automation/ConvertToEfficiency.py | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/tuning/automation/ConvertToEfficiency.py b/tuning/automation/ConvertToEfficiency.py index 6a1a53950..ce63bcbcd 100644 --- a/tuning/automation/ConvertToEfficiency.py +++ b/tuning/automation/ConvertToEfficiency.py @@ -39,6 +39,7 @@ def parseArgs(): "per-cu" : "If tuning was done per CU", \ "name" : "Name substring to filter which files are modified", \ "mfma" : "If MFMA instructions were used for tuning", \ + "x" : "to select A (default), or X node", \ "mi50" : "For vega20, if tuning was done on mi50" } @@ -49,6 +50,7 @@ def parseArgs(): argParser.add_argument("-p", "--per-cu", action="store_true", help=h["per-cu"]) argParser.add_argument("-n", "--name", type=str, help=h["name"]) argParser.add_argument("-m", "--mfma", action="store_true", help=h["mfma"]) + argParser.add_argument("-x", action="store_true", help=h["x"]) argParser.add_argument("--mi50", action="store_true", help=h["mi50"]) return argParser.parse_args() @@ -90,8 +92,12 @@ def main(): data = yaml.safe_load(y) sched = data[1] - type = DataType(data[4]["DataType"]).toChar() + if args.x: + sched+="X" + type = DataType(data[4]["DataType"]).toChar() + if type=="S" and data[4]["F32XdlMathOp"]==9: + type="X" if type in specs[sched][mfmaKey]: alu = specs[sched][mfmaKey][type] 
else: From 4532f2430eeb6ab54270647871625810932f63f7 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Wed, 13 Dec 2023 00:25:16 +0900 Subject: [PATCH 19/51] No reject for GlobalSplitU=1 + MultipleBuffer (#1847) - change GSUA to SingleBuffer instead of rejecting it --- Tensile/SolutionStructs.py | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index 5a51e65e1..7ac9885cd 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -3370,9 +3370,7 @@ def assignDerivedParameters(state): # to eliminate identical/duplicate kernels when GSU=1 if state["GlobalSplitU"] == 1: state["MinKForGSU"] = 256 - # GlobalSplitUAlgorithm is MultipleBuffer - if state["GlobalSplitUAlgorithm"] == 'MultipleBuffer': - reject(state, " GlobalSplitU=1 and GlobalSplitUAlgorithm='MultipleBuffer'. Rejecting GlobalSplitUAlgorithm='SingleBuffer' to avoid duplicate kernels.") + state["GlobalSplitUAlgorithm"] = 'SingleBuffer' # force to use SingleBuffer for GSU=1 (instead of rejecting it) # GlobalSplitUAtomicAdd is True if state["GlobalSplitUAtomicAdd"]: reject(state, " GlobalSplitU=1 and GlobalSplitUAtomicAdd=True. 
Rejecting to avoid duplicate kernels.") From f8bdfff410c68a7673338282190209a6dd23f011 Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Tue, 12 Dec 2023 16:44:52 -0700 Subject: [PATCH 20/51] More cleanup on unused old client code (#1845) --- Tensile/BenchmarkProblems.py | 11 +- Tensile/SolutionWriter.py | 1074 ----------------- Tensile/TensileCreateLibrary.py | 31 +- .../Tests/unit/test_TensileCreateLibrary.py | 16 +- 4 files changed, 19 insertions(+), 1113 deletions(-) delete mode 100644 Tensile/SolutionWriter.py diff --git a/Tensile/BenchmarkProblems.py b/Tensile/BenchmarkProblems.py index 2fb094d60..7ae1c318b 100644 --- a/Tensile/BenchmarkProblems.py +++ b/Tensile/BenchmarkProblems.py @@ -40,8 +40,7 @@ from .KernelWriterAssembly import KernelWriterAssembly from .KernelWriterSource import KernelWriterSource from .SolutionStructs import Solution, ProblemType, ProblemSizes -from .SolutionWriter import SolutionWriter -from .TensileCreateLibrary import copyStaticFiles, writeSolutionsAndKernels +from .TensileCreateLibrary import copyStaticFiles, writeKernels from .CustomKernels import getCustomKernelConfig def generateForkedSolutions(problemType, constantParams, forkPermutations): @@ -142,20 +141,16 @@ def writeBenchmarkFiles(stepBaseDir, solutions, problemSizes, \ kernelHelperOjbs.append(ko) kernelHelperNames.add(kname) - solutionSerialNaming = Solution.getSerialNaming(solutions) kernelSerialNaming = Solution.getSerialNaming(kernels) - solutionMinNaming = Solution.getMinNaming(solutions) kernelMinNaming = Solution.getMinNaming(kernels) - solutionWriter = SolutionWriter(solutionMinNaming, \ - solutionSerialNaming, kernelMinNaming, kernelSerialNaming) kernelWriterSource = KernelWriterSource(kernelMinNaming, kernelSerialNaming) kernelWriterAssembly = KernelWriterAssembly(kernelMinNaming, kernelSerialNaming) # write solution, kernels and CMake problemType = solutions[0]["ProblemType"] - codeObjectFiles = writeSolutionsAndKernels( \ + codeObjectFiles = writeKernels( \ 
globalParameters["WorkingPath"], globalParameters["CxxCompiler"], \ - [problemType], solutions, kernels, kernelHelperOjbs, solutionWriter, \ + [problemType], solutions, kernels, kernelHelperOjbs, \ kernelWriterSource, kernelWriterAssembly, errorTolerant=True ) # ^ this is where solutions is mutated diff --git a/Tensile/SolutionWriter.py b/Tensile/SolutionWriter.py deleted file mode 100644 index 6780c52cd..000000000 --- a/Tensile/SolutionWriter.py +++ /dev/null @@ -1,1074 +0,0 @@ -################################################################################ -# -# Copyright (C) 2016-2022 Advanced Micro Devices, Inc. All rights reserved. -# -# Permission is hereby granted, free of charge, to any person obtaining a copy -# of this software and associated documentation files (the "Software"), to deal -# in the Software without restriction, including without limitation the rights -# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell -# copies of the Software, and to permit persons to whom the Software is -# furnished to do so, subject to the following conditions: -# -# The above copyright notice and this permission notice shall be included in -# all copies or substantial portions of the Software. -# -# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR -# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, -# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE -# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER -# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, -# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE -# SOFTWARE. 
-# -################################################################################ - -from .SolutionStructs import Solution, isPackedIndex -from .KernelWriterSource import KernelWriterSource -from .Common import globalParameters - -################################################################################ -# SolutionWriter -################################################################################ -class SolutionWriter: - - indexChars = globalParameters["IndexChars"] - - ############################################################################## - # SolutionWriter - ############################################################################## - def __init__(self, solutionMinNaming, solutionSerialNaming, \ - kernelMinNaming, kernelSerialNaming): - self.language = globalParameters["RuntimeLanguage"] - self.solutionMinNaming = solutionMinNaming - self.solutionSerialNaming = solutionSerialNaming - self.kernelMinNaming = kernelMinNaming - self.kernelSerialNaming = kernelSerialNaming - # only using getKernelName from KernelWriter so child doesn't matter - self.kernelWriter = KernelWriterSource( kernelMinNaming, kernelSerialNaming) - - self.streamName = "hipStream_t" if self.language == "HIP" \ - else "cl_command_queue" - self.eventName = "hipEvent_t" if self.language == "HIP" \ - else "cl_event" - # rocblas expects Tensile routines to return hip error codes - self.statusName = "TensileStatus" - self.strideList = [] - self.sizeList = [] - - - ############################################################################## - # get solution name - ############################################################################## - def getSolutionName(self, solution): - solutionName = Solution.getNameMin(solution, self.solutionMinNaming) - return solutionName - - ############################################################################## - # getSourceString - ############################################################################## - def 
getProblemSourceString(self, problemType, solution, kernelsWithBuildErrs): - gsu = solution["GlobalSplitU"] - persistent = solution["PersistentKernel"] - kernelLanguage = solution["KernelLanguage"] - tt0 = solution["ThreadTile0"] - tt1 = solution["ThreadTile1"] - sg0 = solution["SubGroup0"] - sg1 = solution["SubGroup1"] - nt = solution["NumThreads"] - - kernels = solution.getKernels() - kernelNames = [] - kernelBuildErr = 0 - for kernel in kernels: - kernelName = self.kernelWriter.getKernelName(kernel) - if kernelName in kernelsWithBuildErrs: - kernelBuildErr = 1 - kernelNames.append( kernelName ) - - - s = "" - t = "" - # includes - - problemType = solution["ProblemType"] # shortcut - - if not globalParameters["MergeFiles"]: - solutionName = self.getSolutionName(solution) - s += "#include \"%s.h\"\n" % solutionName - s += "\n" - - s += self.getSolutionSignature(solution) - - s += " {\n" - if kernelBuildErr: - s += "%s return tensileStatusFailure; // One or more kernels had build failures (%s)\n" % (t, kernelNames) - s += "%s}\n" % (t) - return s - - t += " " - s += "%sTensileStatus status;\n" % (t) - - - # hipFunction Struct - if kernelLanguage == "Assembly": - s += "\n" - s += "%s/* module function args */\n" % (t) - s += "%sstruct {\n" % t - t += " " - if globalParameters["DebugKernel"]: - s += "%sunsigned int *debugBuffer;\n" % t - # Tensor sizes in elements, including only packed dims, - # and accounting for zero or other strides < size - # Place these first in the structure since they are 64-bits - # and need to avoid any unneeded padding: - s += "%s// Size of Tensor's packed dims, in elements\n" % t - s += "%suint64_t tensor2dSizeC;\n" % t - s += "%suint64_t tensor2dSizeA;\n" % t - s += "%suint64_t tensor2dSizeB;\n" % t - solutionArgs = self.getArgList(problemType, False, True, False, False, False, solution["_GlobalAccumulation"]) - for arg in solutionArgs: - if arg[0] == "TensileHalf": - s += "%s%s %s[2];\n" % (t, arg[0], arg[1]) - else: - s += "%s%s %s;\n" 
% (t, arg[0], arg[1]) - for idxChar in solution["PackedC0IdxChars"][:-1]: - s += "%sunsigned magicNumberSize%s;\n" % (t, idxChar) - s += "%sunsigned magicShiftSize%s;\n" % (t, idxChar) - for idxChar in solution["PackedC1IdxChars"][:-1]: - s += "%sunsigned magicNumberSize%s;\n" % (t, idxChar) - s += "%sunsigned magicShiftSize%s;\n" % (t, idxChar) - - # number of unroll loop iterations to stagger the start in "U" dim. - s += "%sint staggerUIter;\n" % t - - # persistent - s += "%sunsigned int problemNumGroupTiles0;\n" % t - s += "%sunsigned int problemNumGroupTiles1;\n" % t - s += "%sunsigned int magicNumberProblemNumGroupTiles0;\n" % t - s += "%sunsigned int gridNumWorkGroups0;\n" % t - s += "%sunsigned int numFullBlocks;\n" % t - s += "%sunsigned int wgmRemainder1;\n" % t - s += "%sunsigned int magicNumberWgmRemainder1;\n" % t - - s += "%sunsigned int pad;\n" % t # FIXME can this be removed? - t = t[2:] - s += "%s} hipFunctionArgs;\n" % t - #s += "%sprintf(\"hipFunctionArgsSize: %%lu\\n\", sizeof(hipFunctionArgs));\n" % t - s += "%ssize_t hipFunctionArgsSize = sizeof(hipFunctionArgs);\n" % t - s += "%svoid *hipLaunchParams[] = {HIP_LAUNCH_PARAM_BUFFER_POINTER, &hipFunctionArgs, HIP_LAUNCH_PARAM_BUFFER_SIZE, &hipFunctionArgsSize, HIP_LAUNCH_PARAM_END};\n" % t - #s += "%sprintf(\"size: %%lu\\n\", sizeof(unsigned int));\n" % t - #s += "%sprintf(\"hipFunctionArgsSize: %%lu\\n\", sizeof(hipFunctionArgs));\n" % t - #for arg in solutionArgs: - # s += "%sprintf(\"%s: %%lu\\n\", static_cast(static_cast(&hipFunctionArgs.%s)) - static_cast(static_cast(&hipFunctionArgs.%s)));\n" % (t, arg[1], arg[1], solutionArgs[0][1]) - - # NOTE: host compiler aligns size of structs to 64-bits (at least) and aligns the offset of pointers to 64-bits, therefore, having pointers which are not at the beginning of the struct may get padded/shifted by the host compiler and, therefore, not coppied correctly to gpu - - if globalParameters["RuntimeLanguage"] == "HIP": - s += "%sint deviceId;\n" % (t) 
- s += "%shipGetDevice(&deviceId);\n" % (t) - - # kernels - s += "\n%s/* kernels */\n" % (t) - s += "%sconst unsigned int numKernels = %u; // 1 or 4\n" % (t, len(kernels)) - - if kernelLanguage == "Source" and globalParameters["RuntimeLanguage"] == "OCL": - s += "%sconst char *kernelSources[numKernels] = {\n" % (t) - t += " " - for kernelIdx in range(0, len(kernelNames)): - kernelName = kernelNames[kernelIdx] - s += "%s%s_src%s\n" % (t, kernelName, \ - "," if kernelIdx < len(kernels)-1 else "" ) - t = t[2:] - s += "%s};\n" % (t) - s += "%scl_kernel kernels[numKernels];\n" % (t) - s += "%sconst char *buildOptions = \"-cl-std=cl2.0\";\n" % (t) - s += "%sfor (unsigned int i = 0; i < numKernels; i++) {\n" % (t) - s += "%s tensileGetCompiledOpenCLKernel(\n" % (t) - s += "%s &kernels[i],\n" % (t) - s += "%s kernelSources[i],\n" % (t) - s += "%s stream,\n" % (t) - s += "%s buildOptions);\n" % (t) - s += "%s}\n" % (t) - - if gsu > 1: - for ko in solution.getKernelBetaOnlyObjects(): - kernelName = ko.getKernelName(ko) - s += "%scl_kernel kernel_%s;\n" % (t, kernelName) - s += "%s tensileGetCompiledOpenCLKernel(\n" % (t) - s += "%s &kernel_%s,\n" % (t, kernelName) - s += "%s %s_src,\n" % (t, kernelName) - s += "%s stream,\n" % (t) - s += "%s buildOptions);\n" % (t) - - elif kernelLanguage == "Assembly": - kernel = kernels[0] - s += "%shipFunction_t hipFunction;\n" % (t) - # if !CodeFromFiles then pass global _coba that points to code object - s += "%sstatus = solutionLock->getFunction(&hipFunction, deviceId, \"%s\", %s);;\n" \ - % (t, kernelName, "nullptr" if globalParameters["CodeFromFiles"] else kernelName+"_coba" ) - s += "%sif (status) return status;\n" % (t) - - typeName = problemType["DataType"].toCpp() - - # num enqueues - s += "\n%s/* num kernels */\n" % (t) - s += "%sunsigned int numEnqueues[numKernels] = { 1" % (t) - for i in range(1, len(kernels)): - s += ", 1" - s += " };\n" - - # grid size - s += "\n%s/* grid sizes */\n" % (t) - s += "%sconst unsigned int 
workDim = 3;\n" % (t) - s += "%sconst unsigned int threadTile[2] = { %u, %u };\n" \ - % (t, tt0, tt1) - s += "%sconst unsigned int groupSize[2] = { %u, %u };\n" \ - % (t, sg0, sg1) - s += "%ssize_t localWorkSize[3] = { %3u, 1, 1 };\n" \ - % (t, nt) - s += "%ssize_t globalWorkSize[numKernels][3];\n" % (t) - # grid size [2] - s += "%sglobalWorkSize[0][2] = 1;\n" % (t) - for i in range(0, problemType["NumIndicesC"]): - if i != problemType["Index0"] and i != problemType["Index1"] \ - and not isPackedIndex(solution,i): - s += "%sglobalWorkSize[0][2] *= size%s;\n" % (t, self.indexChars[i]) - - s += "%sunsigned int sizeOfC0 = " % (t) - s += " * ".join(["size" + i for i in solution["PackedC0IdxChars"]]) - s += ";\n" - - s += "%sunsigned int sizeOfC1 = " % (t) - s += " * ".join(["size" + i for i in solution["PackedC1IdxChars"]]) - s += ";\n" - - for idxChar in solution["PackedC0IdxChars"][:-1]: - s += "%sunsigned magicShiftSize%s = 33; // bozo, review\n" % (t, idxChar) - s += "%suint64_t magicNumberSize%s = (1L< 0: - s += "%sunsigned numFullBlocks = problemNumGroupTiles1 / %u; // divide by WorkGroupMapping\n" % (t, kernel["WorkGroupMapping"]) - s += "%sunsigned wgmRemainder1 = problemNumGroupTiles1 %% %u;\n" % (t, kernel["WorkGroupMapping"]) - s += "%sif (wgmRemainder1 == 0) wgmRemainder1 = %u;\n" % (t, kernel["WorkGroupMapping"]) - s += "%sunsigned magicNumberWgmRemainder1 = ((1L< 1: - s += "%stotalWorkGroups1 *= %u; // GlobalSplitU\n" % (t, gsu) - if persistent: - s += "%shipDeviceProp_t deviceProperties;\n" % (t) - # TODO - should cache the device properties - expensive to call on each iteration here: - s += "%shipGetDeviceProperties( &deviceProperties, deviceId );\n" % (t) - s += "#if HIP_VERSION >= 50220730\n" - s += "%sint hip_version;\n" % (t) - s += "%shipRuntimeGetVersion(&hip_version);\n" % (t) - s += "%sif(hip_version >= 50220730)\n" % (t) - s += "%s{\n" % (t) - s += "%s hipDeviceGetAttribute(&deviceProperties.multiProcessorCount,\n" % (t) - s += "%s 
hipDeviceAttributePhysicalMultiProcessorCount,\n" % (t) - s += "%s deviceId);\n" % (t) - s += "%s}\n" % (t) - s += "#endif\n" - s += "%sunsigned int numGroups = totalWorkGroups0 * totalWorkGroups1;\n" % (t) - s += "%sglobalWorkSize[0][0] = (deviceProperties.multiProcessorCount * %u < numGroups) ? (deviceProperties.multiProcessorCount * %u) : numGroups;\n" \ - % (t, persistent, persistent) - - s += "%sglobalWorkSize[0][1] = 1;\n" % t - else: - s += "%sglobalWorkSize[0][0] = totalWorkGroups%u%s;\n" % (t, 0 if kernel["WorkGroupMapping"] >= 0 else 1, "*localWorkSize[0]" if self.language == "OCL" else "") - s += "%sglobalWorkSize[0][1] = totalWorkGroups%u%s;\n" % (t, 1 if kernel["WorkGroupMapping"] >= 0 else 0, "*localWorkSize[1]" if self.language == "OCL" else "") - - # index sizes - s += "\n%s/* index sizes */\n" % (t) - s += "%sunsigned int sizes[numKernels][1][%u];\n" \ - % (t, problemType["TotalIndices"]) - for kernelIdx in range(0, len(kernels)): - kernel = kernels[kernelIdx] - kernelName = self.kernelWriter.getKernelName(kernel) - # free index sizes - for i in range(0,problemType["NumIndicesFree"] \ - + problemType["NumIndicesBatch"] ): - s += "%ssizes[%u][0][%u] = size%s;\n" \ - % (t, kernelIdx, i, self.indexChars[i]) - # summation index sizes - for i in range(problemType["NumIndicesC"], \ - problemType["TotalIndices"] ): - lastParam = i == problemType["TotalIndices"]-1 - s += "%ssizes[%u][0][%u] = size%s;\n" \ - % (t, kernelIdx, i, self.indexChars[i]) - - # Tensor2DSizes - size excluding the batch dimension, accounts for cases where one of strides is 0 - #print "IndexAssignmentsA=", problemType["IndexAssignmentsA"], "Batch=", problemType["IndicesBatch"] - firstStride = 0 if problemType["UseInitialStridesCD"] else 1 - del i - - numIdx = problemType["NumIndicesC"] - printMe = 0 - s += "%suint64_t tensor2dSizeC = %s" % \ - (t, "1" if firstStride==1 else "strideC%u%s"% (0,self.indexChars[0])) - for idx in range(0,numIdx): - # Multiply only by packed tensor dims - 
if idx in problemType["IndicesFree"]: - printMe = True - else: - printMe = False - - if printMe: - if idx+1 < numIdx: - strideIdx = idx+1 - s += " * std::max(size%s, strideC%u%s)" % \ - (self.indexChars[idx], idx+1, self.indexChars[strideIdx]) - else: - s += " * size%s" % (self.indexChars[idx]) - s += ";\n" - - s += "%suint64_t tensor2dSizeA = 1;\n" % t - s += "%suint64_t tensor2dSizeAStride = 0;\n" % t - s += "%suint64_t tensor2dSizeAOffset = 0;\n" % t - numIdx = len(problemType["IndexAssignmentsA"]) - - printMe = False - for i in range(0,numIdx): - idx = problemType["IndexAssignmentsA"][i] - - # Don't multiple batch dimensions that will be backed into SRD: - if idx in solution["PackedC0IndicesX"]: - printMe = True - elif idx in problemType["IndicesSummation"]: - printMe = True - else: - printMe = False - - if printMe: - if i+1 < numIdx: - strideIdx = problemType["IndexAssignmentsA"][i+1] - s += "%stensor2dSizeAStride = std::max(tensor2dSizeA*size%s, (uint64_t)strideA%u%s);\n" \ - % (t, self.indexChars[idx], i+1, self.indexChars[strideIdx]) - s += "%stensor2dSizeAOffset += tensor2dSizeAStride - tensor2dSizeA*size%s;\n" \ - % (t, self.indexChars[idx]) - s += "%stensor2dSizeA = tensor2dSizeAStride;\n" % (t) - else: - s += "%stensor2dSizeA = tensor2dSizeA * size%s;\n" % (t, self.indexChars[idx]) - - s += "%stensor2dSizeA -= tensor2dSizeAOffset;\n" % t - s += "\n" - - s += "%suint64_t tensor2dSizeB = 1;\n" % t - s += "%suint64_t tensor2dSizeBStride = 0;\n" % t - s += "%suint64_t tensor2dSizeBOffset = 0;\n" % t - numIdx = len(problemType["IndexAssignmentsB"]) - printMe = False - for i in range(0,numIdx): - idx = problemType["IndexAssignmentsB"][i] - - # Multiply only by first free and first summation - if idx in solution["PackedC1IndicesX"]: - printMe = True - elif idx in problemType["IndicesSummation"]: - printMe = True - else: - printMe = False - - if printMe: - if i+1 < numIdx: - strideIdx = problemType["IndexAssignmentsB"][i+1] - s += "%stensor2dSizeBStride = 
std::max(tensor2dSizeB*size%s, (uint64_t)strideB%u%s);\n" \ - % (t, self.indexChars[idx], i+1, self.indexChars[strideIdx]) - s += "%stensor2dSizeBOffset += tensor2dSizeBStride - tensor2dSizeB*size%s;\n" \ - % (t, self.indexChars[idx]) - s += "%stensor2dSizeB = tensor2dSizeBStride;\n" % (t) - else: - s += "%stensor2dSizeB = tensor2dSizeB * size%s;\n" % (t, self.indexChars[idx]) - - s += "%stensor2dSizeB -= tensor2dSizeBOffset;\n" % t - s += "\n" - - unrollChar = globalParameters["IndexChars"][problemType["IndexUnroll"]] - - s += " unsigned int staggerUIter = %s; // how many stride-sized clicks to stagger start offset\n" \ - % (solution["StaggerU"]) - s += " int unrollLoopIters = size%s/%u/%u; // /DepthU/GSU\n" % (unrollChar, solution["DepthU"], gsu) - s += " while (staggerUIter>1) {\n" - s += " if (unrollLoopIters >= (staggerUIter*%u)) {\n" % (1< 1: - s += "%ssize_t sizeOfC = sizeOfC0 * sizeOfC1;\n" % (t) - for i in range(0, problemType["NumIndicesC"]): - if i != problemType["Index0"] and i != problemType["Index1"]: - s += "%ssizeOfC *= size%s;\n" % (t, self.indexChars[i]) - - ######################################## - # Enqueue Beta-Only Kernel - ######################################## - if gsu > 1 and kernel["_GlobalAccumulation"] != 'MultipleBuffer': - kernelNamesBetaOnly = [] - for ko in solution.getKernelBetaOnlyObjects(): - kernelName = ko.getKernelName() - kernelNamesBetaOnly.append(kernelName) - s += "%s// enqueue Beta-Only kernel\n" % (t) - - # grid sizes - s += "%ssize_t localWorkSizeBetaOnly[3] = { 256, 1, 1};\n" % (t) - s += "%ssize_t globalWorkSizeBetaOnly[3] = { 1, 1, 1};\n" % (t) - s += "%sglobalWorkSizeBetaOnly[0] = (sizeOfC + globalWorkSizeBetaOnly[0] - 1) / globalWorkSizeBetaOnly[0];\n" % (t) - s += "%s// b/c single kernel, add extra work-group here if edge needed\n" % (t) - - if problemType["UseBeta"]: - s += "%sbool betaZero = beta == (%s)0;\n" % (t, typeName) - if self.language == "OCL": - if problemType["UseBeta"]: - s += "%scl_kernel 
kernelBetaOnly = betaZero ? kernel_%s : kernel_%s;\n" \ - % (t, kernelNamesBetaOnly[0], kernelNamesBetaOnly[1]) - else: - #s += "%sbool betaZero = true;\n" % (t) - s += "%scl_kernel kernelBetaOnly = kernel_%s;\n" \ - % (t, kernelNamesBetaOnly[0]) - argIdx = 0 - s += "%sstatus = clSetKernelArg( kernelBetaOnly, %u, sizeof(cl_mem), &dataC ); tensileStatusCheck(status);\n" % (t, argIdx); argIdx+=1 - # strides - for i in range(0,numStridesC): - s += "%sstatus = clSetKernelArg( kernelBetaOnly, %u, sizeof(unsigned int), &%s ); tensileStatusCheck(status);\n" % (t, argIdx, self.strideList[i]); argIdx+=1 - # sizes - for i in range(0, problemType["NumIndicesC"]): - s += "%sstatus = clSetKernelArg( kernelBetaOnly, %u, sizeof(unsigned int), &size%s ); tensileStatusCheck(status);\n" % (t, argIdx, self.indexChars[i]); argIdx+=1 - # beta - if problemType["UseBeta"]: - s += "%sif (!betaZero) {\n" % (t) - s += "%s status = clSetKernelArg( kernelBetaOnly, %u, sizeof(%s), &beta ); tensileStatusCheck(status);\n" % (t, argIdx, typeName); argIdx+=1 - s += "%s}\n" % (t) - # enqueue - s += "%scl_event kernelEventBetaOnly;\n" % (t) - s += "%sstatus = clEnqueueNDRangeKernel(\n" % (t) - t += " " - s += "%sstream,\n" % (t) - s += "%skernelBetaOnly,\n" % (t) - s += "%sworkDim,\n" % (t) - s += "%sNULL, // globalWorkOffset\n" % (t) - s += "%sglobalWorkSizeBetaOnly,\n" % (t) - s += "%slocalWorkSizeBetaOnly,\n" % (t) - s += "%snumInputEvents,\n" % (t) - s += "%sinputEvents,\n" % (t) - #s += "%soutputEvent );\n" % (t) - s += "%s&kernelEventBetaOnly );\n" % (t) - t = t[2:] - s += "%stensileStatusCheck(status);\n" % (t) - if problemType["UseBeta"]: - s += "%sbeta = %s;\n" % (t, problemType["DataType"].zeroString(self.language, 1) ) - #s += "%sreturn tensileStatusSuccess;\n" % (t) - s += "%sstatus = clFinish(stream);\n" % (t) - s += "%stensileStatusCheck(status);\n" % (t) - #s += " float tmp[128*128];\n" - #s += "clEnqueueReadBuffer(stream, dataC, CL_TRUE, 0, 128*128*sizeof(float), tmp, 0, NULL, 
NULL);\n" - #s += "for (unsigned int i = 0; i < 128*128; i++) { printf(\"%f\\n\", tmp[i]); }\n" - else: - s += "%stry {\n" % (t) - t += " " - # TODO - timing with beta kernels is somewhat pessimistic since it has this separate event only on the GSU path. - # Introduces 2-3us of overhead ; may want to disable PreciseKernelTime so non-GSU have same overhead. - # Long-term fix would be to launch the beta kernel with the hipHccModule* API and set start-event in that call - s += "%sif( inputEvents != NULL )\n" % (t) - s += "%s hipEventRecord(inputEvents[0], stream );\n" % (t) - s += "%skernelsLaunched++;\n" % (t) - s += "%shipLaunchKernelGGL(\n" % (t) - t += " " - s += "%sHIP_KERNEL_NAME(%s),\n" % (t, kernelNamesBetaOnly[0]) - s += "%sdim3(globalWorkSizeBetaOnly[0], globalWorkSizeBetaOnly[1], globalWorkSizeBetaOnly[2]),\n" % (t) - s += "%sdim3(localWorkSizeBetaOnly[0], localWorkSizeBetaOnly[1], localWorkSizeBetaOnly[2]),\n" % (t) - s += "%s0, // groupMemBytes\n" % (t) - s += "%sstream,\n" % (t) - s += "%sworkspace,\n" % (t) if solution["_GlobalAccumulation"] else ("%sdataD,\n" % (t)) - s += "%sdataC,\n" % (t) - # strides - if kernel["_GlobalAccumulation"]: - for i in range(0, numStridesC): - s += "%s%s,\n" % (t, WSstrides[i]) - else: - for i in range(0, numStridesC): - s += "%s%s,\n" % (t, self.strideList[i]) - for i in range(numStridesC, numStridesC*2): - s += "%s%s,\n" % (t, self.strideList[i]) - # sizes - for i in range(0, problemType["NumIndicesC"]): - s += "%ssize%s,\n" % (t, self.indexChars[i]) - s += ("%sbeta);\n" % (t)) if problemType["UseBeta"] else ("%s0.0f);\n" % (t)) - t = t[:-2] - - t = t[:-2] - s += "%s} catch (const std::exception& e) {\n" % (t) - t += " " - s += "#ifdef DEBUG\n" - s += "%s std::cerr << e.what() << std::endl;\n" % (t) - s += "#endif\n" - s += "%s return tensileStatusFailure;\n" % (t) - t = t[:-2] - s += "%s}\n" % (t) - - ######################################## - # Enqueue Kernels - ######################################## - for kernelIdx 
in range(0, len(kernels)): - kernel = kernels[kernelIdx] - if kernel["KernelLanguage"] == "Source": - kernel["ISA"] = [0, 0, 0] # HIP source kernels needs dummy ISA version - kernelName = self.kernelWriter.getKernelName(kernel) - s += "\n%s/* kernel %u: %s */\n" % (t, kernelIdx, kernelName) - s += "%sunsigned int kernelIdx = %u;\n" % (t, kernelIdx) - if self.language == "OCL": - # set kernel args same for all enqueues - s += "%s// kernel args same for all enqueues\n" % (t) - s += "%sstatus = clSetKernelArg( kernels[kernelIdx], %u, sizeof(cl_mem), &dataD ); tensileStatusCheck(status);\n" % (t, 0) - s += "%sstatus = clSetKernelArg( kernels[kernelIdx], %u, sizeof(cl_mem), &dataC ); tensileStatusCheck(status);\n" % (t, 1) - s += "%sstatus = clSetKernelArg( kernels[kernelIdx], %u, sizeof(cl_mem), &dataA ); tensileStatusCheck(status);\n" % (t, 2) - s += "%sstatus = clSetKernelArg( kernels[kernelIdx], %u, sizeof(cl_mem), &dataB ); tensileStatusCheck(status);\n" % (t, 3) - s += "%sstatus = clSetKernelArg( kernels[kernelIdx], %u, sizeof(%s), &alpha ); tensileStatusCheck(status);\n" % (t, 4, typeName) - s += "%s%sstatus = clSetKernelArg( kernels[kernelIdx], %u, sizeof(%s), &beta ); tensileStatusCheck(status);\n" % (t, \ - "" if problemType["UseBeta"] else "//", 5, typeName) - argIdx = 6 if problemType["UseBeta"] else 5 - for stride in self.strideList: - s += "%sstatus = clSetKernelArg( kernels[kernelIdx], %u, sizeof(unsigned int), &%s ); tensileStatusCheck(status);\n" % (t, argIdx, stride) - argIdx += 1 - for sizeIdx in range(0, problemType["TotalIndices"]): - if sizeIdx not in [ problemType["Index0"], problemType["Index1"], problemType["IndexUnroll"] ]: - s += "%sstatus = clSetKernelArg( kernels[kernelIdx], %u, sizeof(unsigned int), &size%s ); tensileStatusCheck(status);\n" % (t, argIdx, self.indexChars[sizeIdx]) - argIdx += 1 - - s += "%sstatus = clSetKernelArg( kernels[kernelIdx], %u, sizeof(staggerUIter), &staggerUIter ); tensileStatusCheck(status);\n" % (t, argIdx) - 
argIdx += 1 - - s += "%sfor (unsigned int enqueueIdx = 0; enqueueIdx < numEnqueues[%u]; enqueueIdx++) {\n" % (t, kernelIdx) - t += " " - # debug print kernel dimensions - if globalParameters["LibraryPrintDebug"]: - s += "%sprintf(\"%s: g{ %%u, %%u, %%u } l{ %%u, %%u, %%u}\\n\", static_cast(globalWorkSize[kernelIdx][0]), static_cast(globalWorkSize[kernelIdx][1]), static_cast(globalWorkSize[kernelIdx][2]), static_cast(localWorkSize[0]), static_cast(localWorkSize[1]), static_cast(localWorkSize[2]) );\n" % (t, kernelName) - # debug print kernel arguments - # strides - for stride in self.strideList: - s += "%sprintf(\" %s = %%u\\n\", %s);\n" % (t, stride, stride) - # sizes - for i in range(0, problemType["TotalIndices"]): - s += "%sprintf(\" sizes[kernelIdx][enqueueIdx][%u] = %%u\\n\", sizes[kernelIdx][enqueueIdx][%u] );\n" % (t, i, i ) - s += "%sprintf(\" staggerUIter == %%u\\n\", staggerUIter );\n" % (t) - s += "%sprintf(\" problemNumGroupTiles0== %%u\\n\", problemNumGroupTiles0 );\n" % (t) - s += "%sprintf(\" problemNumGroupTiles1== %%u\\n\", problemNumGroupTiles1 );\n" % (t) - s += "%sprintf(\" tensor2dSizeC== %%lu\\n\", tensor2dSizeC );\n" % (t) - s += "%sprintf(\" tensor2dSizeA== %%lu\\n\", tensor2dSizeA );\n" % (t) - s += "%sprintf(\" tensor2dSizeB== %%lu\\n\", tensor2dSizeB );\n" % (t) - for idxChar in solution["PackedC0IdxChars"][:-1]: - s += "%sprintf(\" magicNumberSize%s== 0x%%lx, magicShiftSize%s== %%u)\\n\", magicNumberSize%s, magicShiftSize%s);\n" \ - % (t, idxChar, idxChar, idxChar, idxChar) - for idxChar in solution["PackedC1IdxChars"][:-1]: - s += "%sprintf(\" magicNumberSize%s== 0x%%x, magicShiftSize%s== %%u)\\n\", magicNumberSize%s, magicShiftSize%s);\n" \ - % (t, idxChar, idxChar, idxChar, idxChar) - s += "%sprintf(\" magicNumberProblemNumGroupTiles0==%%u\\n\", magicNumberProblemNumGroupTiles0);\n" % t - - ######################################## - # OpenCL Runtime - ######################################## - if self.language == "OCL": - # set kernel 
args different for all enqueues - argIdx = 6 if problemType["UseBeta"] else 5 - argIdx += len(self.strideList) - # sizes - for sizeIdx in range(0, problemType["TotalIndices"]): - if sizeIdx in [ problemType["Index0"], problemType["Index1"], problemType["IndexUnroll"] ]: - s += "%sstatus = clSetKernelArg( kernels[kernelIdx], %u, sizeof(unsigned int), &size%s ); tensileStatusCheck(status);\n" % (t, argIdx, self.indexChars[sizeIdx]) - argIdx += 1 - - # enqueue - s += "%sstatus = clEnqueueNDRangeKernel(\n" % (t) - t += " " - s += "%sstream,\n" % (t) - s += "%skernels[kernelIdx],\n" % (t) - s += "%sworkDim,\n" % (t) - s += "%sNULL, // globalWorkOffset\n" % (t) - s += "%sglobalWorkSize[kernelIdx],\n" % (t) - s += "%slocalWorkSize,\n" % (t) - if False: # gsu > 1: - s += "%s1,\n" % (t) - s += "%s&kernelEventBetaOnly,\n" % (t) - else: - s += "%snumInputEvents,\n" % (t) - s += "%sinputEvents,\n" % (t) - s += "%soutputEvent );\n" % (t) - s += "%stensileStatusCheck(status);\n" % (t) - t = t[:-2] - s += "%s}\n" % (t) - - ######################################## - # HIP Runtime - ######################################## - else: - - if not globalParameters["PreciseKernelTime"] or kernelLanguage == "Source": - s += "%sif( inputEvents != NULL )\n" % (t) - t += " " - s += "%shipEventRecord(inputEvents[enqueueIdx], stream );\n" % (t) - s += "%stry {\n" % (t) - t += " " - # hip kernel - if kernelLanguage == "Source": - s += "%skernelsLaunched++;\n" % (t) - s += "%shipLaunchKernelGGL(\n" % (t) - t += " " - s += "%sHIP_KERNEL_NAME(%s),\n" % (t, kernelName) - s += "%sdim3(globalWorkSize[kernelIdx][0], globalWorkSize[kernelIdx][1], globalWorkSize[kernelIdx][2]),\n" % (t) - s += "%sdim3(localWorkSize[0], localWorkSize[1], localWorkSize[2]),\n" % (t) - s += "%s0, // groupMemBytes\n" % (t) - s += "%sstream,\n" % (t) - s += ("%sdataD,\n") % (t) if not solution["_GlobalAccumulation"] else ("%sworkspace,\n" % (t)) - s += ("%sdataC,\n") % (t) if not solution["_GlobalAccumulation"] else 
("%sworkspace,\n" % (t)) - s += "%sdataA,\n" % (t) - s += "%sdataB,\n" % (t) - s += "%salpha,\n" % (t) - s += "%s%sbeta,\n" % (t, \ - "" if problemType["UseBeta"] else "//") - # strides - if kernel["_GlobalAccumulation"]: - for i in range(0, numStridesC): - s += "%s%s,\n" % (t, WSstrides[i]) - for i in range(0, numStridesC): - s += "%s%s,\n" % (t, WSstrides[i]) - for i in range(numStridesC*2, len(self.strideList)): - s += "%s%s,\n" % (t, self.strideList[i]) - else: - for stride in self.strideList: - s += "%s%s,\n" % (t, stride) - # sizes - for i in range(0, problemType["TotalIndices"]): - lastParam = i == problemType["TotalIndices"]-1 - s += "%ssizes[kernelIdx][enqueueIdx][%u]%s\n" \ - % (t, i, "" if lastParam else "," ) - for idxChar in solution["PackedC0IdxChars"][:-1]: - s += "%s,static_cast(magicNumberSize%s)\n" % (t, idxChar) - s += "%s,magicShiftSize%s\n" % (t, idxChar) - for idxChar in solution["PackedC1IdxChars"][:-1]: - s += "%s,static_cast(magicNumberSize%s)\n" % (t, idxChar) - s += "%s,magicShiftSize%s\n" % (t, idxChar) - s += "%s,staggerUIter\n" % (t) - #persistent: - s += "%s,problemNumGroupTiles0\n" % (t) - s += "%s,problemNumGroupTiles1\n" % (t) - s += "%s,magicNumberProblemNumGroupTiles0\n" % (t) # magic number to use when dividing by problemNumGroupTiles0 - s += "%s);\n" % (t) - t = t[:-2] - # assembly kernel - else: - if globalParameters["DebugKernel"]: - s += "%sconst unsigned int debugBufferElementsPerThread = 16;\n" % t - s += "%sunsigned int debugBufferNumElem = debugBufferElementsPerThread;\n" % (t) - s += "%sdebugBufferNumElem *= max(1,globalWorkSize[kernelIdx][0]);\n" % (t) - s += "%sdebugBufferNumElem *= max(1,globalWorkSize[kernelIdx][1]);\n" % (t) - s += "%sdebugBufferNumElem *= max(1,globalWorkSize[kernelIdx][2]);\n" % (t) - s += "%sdebugBufferNumElem *= localWorkSize[0];\n" % (t) - s += "%sdebugBufferNumElem *= localWorkSize[1];\n" % (t) - s += "%sdebugBufferNumElem *= localWorkSize[2];\n" % (t) - s += "%s printf(\"debugBufferNumElem: 
%%04i: \\n\", debugBufferNumElem);\n" % (t) - s += "%ssize_t debugBufferSize = debugBufferNumElem * sizeof(unsigned int);\n" % (t) - s += "%shipDevice_t device;\n" % t - s += "%shipDeviceGet(&device, 0);\n" % t - s += "%shipMalloc(&(hipFunctionArgs.debugBuffer), debugBufferSize);\n" % t - s += "%sunsigned int *debugBufferHostPtr = new unsigned int[debugBufferNumElem];\n" % (t) - s += "%smemset(debugBufferHostPtr,0,debugBufferSize);\n" % (t) - s += "%shipMemcpyHtoD(hipFunctionArgs.debugBuffer, debugBufferHostPtr, debugBufferSize);\n" % (t) - s += "%smemset(debugBufferHostPtr,1,debugBufferSize);\n" % (t) - - # hip assembly function - s += "%shipFunctionArgs.tensor2dSizeC = tensor2dSizeC;\n" % (t) - s += "%shipFunctionArgs.tensor2dSizeA = tensor2dSizeA;\n" % (t) - s += "%shipFunctionArgs.tensor2dSizeB = tensor2dSizeB;\n" % (t) - - if solution["_GlobalAccumulation"]: - s += "%shipFunctionArgs.dataD = workspace;\n" % (t) - s += "%shipFunctionArgs.dataC = workspace;\n" % (t) - else: - s += "%shipFunctionArgs.dataD = dataD;\n" % (t) - s += "%shipFunctionArgs.dataC = dataC;\n" % (t) - s += "%shipFunctionArgs.dataA = dataA;\n" % (t) - s += "%shipFunctionArgs.dataB = dataB;\n" % (t) - - if problemType["ComputeDataType"].isHalf(): - s += "%shipFunctionArgs.alpha[0] = alpha;\n" % (t) - s += "%shipFunctionArgs.alpha[1] = alpha;\n" % (t) - else: - s += "%shipFunctionArgs.alpha = alpha;\n" % (t) - if problemType["UseBeta"]: - if problemType["ComputeDataType"].isHalf(): - s += "%shipFunctionArgs.beta[0] = beta;\n" % (t) - s += "%shipFunctionArgs.beta[1] = beta;\n" % (t) - else: - s += "%shipFunctionArgs.beta = beta;\n" % (t) - # strides - if kernel["_GlobalAccumulation"]: - for i in range(0, numStridesC): - s += "%shipFunctionArgs.%s = %s;\n" % (t, self.strideList[i], WSstrides[i]) - for i in range(0, numStridesC): - s += "%shipFunctionArgs.%s = %s;\n" % (t, self.strideList[i+numStridesC], WSstrides[i]) - for i in range(numStridesC*2, len(self.strideList)): - s += 
"%shipFunctionArgs.%s = %s;\n" % (t, self.strideList[i], self.strideList[i]) - else: - for stride in self.strideList: - s += "%shipFunctionArgs.%s = %s;\n" % (t, stride, stride) - # sizes - for i in range(0, problemType["TotalIndices"]): - lastParam = i == problemType["TotalIndices"]-1 - s += "%shipFunctionArgs.size%s = sizes[kernelIdx][enqueueIdx][%u];\n" \ - % (t, globalParameters["IndexChars"][i], i ) - - s += "%shipFunctionArgs.tensor2dSizeC = tensor2dSizeC;\n" % (t) - s += "%shipFunctionArgs.tensor2dSizeA = tensor2dSizeA;\n" % (t) - s += "%shipFunctionArgs.tensor2dSizeB = tensor2dSizeB;\n" % (t) - - s += "%shipFunctionArgs.staggerUIter = staggerUIter;\n" % (t) - # persistent - pass in the number of tiles in problem since not available in WG - s += "\n" - s += "%shipFunctionArgs.problemNumGroupTiles0 = problemNumGroupTiles0;\n" % (t) - s += "%shipFunctionArgs.problemNumGroupTiles1 = problemNumGroupTiles1;\n" % (t) - s += "%shipFunctionArgs.magicNumberProblemNumGroupTiles0 = magicNumberProblemNumGroupTiles0;\n" % (t) - s += "%shipFunctionArgs.gridNumWorkGroups0 = globalWorkSize[kernelIdx][0];\n" % (t) # - s += "%shipFunctionArgs.numFullBlocks = numFullBlocks;\n" % (t) - s += "%shipFunctionArgs.wgmRemainder1 = wgmRemainder1;\n" % (t) - s += "%shipFunctionArgs.magicNumberWgmRemainder1 = magicNumberWgmRemainder1;\n" % (t) - - # Magic numbers for packed indices: - for idxChar in solution["PackedC0IdxChars"][:-1]: - s += "%shipFunctionArgs.magicNumberSize%s = static_cast(magicNumberSize%s);\n" % (t, idxChar, idxChar) - s += "%shipFunctionArgs.magicShiftSize%s = magicShiftSize%s;\n" % (t, idxChar, idxChar) - for idxChar in solution["PackedC1IdxChars"][:-1]: - s += "%shipFunctionArgs.magicNumberSize%s = static_cast(magicNumberSize%s);\n" % (t, idxChar, idxChar) - s += "%shipFunctionArgs.magicShiftSize%s = magicShiftSize%s;\n" % (t, idxChar, idxChar) - if globalParameters["LibraryPrintDebug"]: - s += """ - std::vector tmp(hipFunctionArgsSize); - memcpy(tmp.data(), 
&hipFunctionArgs, hipFunctionArgsSize); - for(int i = 0; i < hipFunctionArgsSize; i++) - { - if(i % 8 == 0) printf("\\n"); - - printf("%02hhx", tmp[i]); - } - printf("\\n"); - """ - - s += "%skernelsLaunched++;\n" % (t) - s += "%shipExtModuleLaunchKernel(\n" % (t) - t += " " - s += "%shipFunction,\n" % (t) - s += "%sglobalWorkSize[kernelIdx][0]*localWorkSize[0],\n" % (t) - s += "%sglobalWorkSize[kernelIdx][1]*localWorkSize[1],\n" % (t) - s += "%sglobalWorkSize[kernelIdx][2]*localWorkSize[2],\n" % (t) - s += "%slocalWorkSize[0],\n" % (t) - s += "%slocalWorkSize[1],\n" % (t) - s += "%slocalWorkSize[2],\n" % (t) - s += "%s0, // groupMemBytes\n" % (t) - s += "%sstream,\n" % (t) - s += "%sNULL,\n" % (t) - s += "%s(void**)hipLaunchParams\n" % (t) - if globalParameters["PreciseKernelTime"]: - if gsu > 1 and kernel["_GlobalAccumulation"] != 'MultipleBuffer': - s += "%s,nullptr\n" %(t) - else: - s += "%s,inputEvents ? inputEvents[enqueueIdx]:nullptr\n" %(t) - if solution["_GlobalAccumulation"]: - s += "%s,nullptr\n" % (t) - else: - s += "%s,outputEvent ? 
outputEvent[enqueueIdx]:nullptr\n" % (t) - - s += "%s);\n" % (t) - t = t[2:] - if globalParameters["DebugKernel"]: - # copy debug buffer - s += "%shipMemcpyDtoH(debugBufferHostPtr, hipFunctionArgs.debugBuffer, debugBufferSize);\n" % (t) - s += "%sfor(unsigned int i = 0; i < debugBufferNumElem/debugBufferElementsPerThread; i++) {\n" % (t) - s += "%s printf(\"%%04i\", i);\n" % (t) - s += "%s char u[debugBufferElementsPerThread] = {1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1};\n" % (t) - #s += "%s char u[debugBufferElementsPerThread] = {0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0};\n" % (t) - #s += "%s char u[debugBufferElementsPerThread] = {1,1,0,0,1,1,0,0,1,1,1,1,1,1,1,1};\n" % (t) - s += "%s for(unsigned int j = 0; j < debugBufferElementsPerThread; j++) {\n" % (t) - s += "%s if (u[j]) printf(\",%%4u\", debugBufferHostPtr[i*debugBufferElementsPerThread+j]);\n" % (t) - s += "%s else printf(\",%%4.0f\", ((float *)debugBufferHostPtr)[i*debugBufferElementsPerThread+j]);\n" % (t) - - s += "%s }\n" % (t) - s += "%s printf(\"\\n\");\n" % (t) - s += "%s}\n" % (t) - - - t = t[2:] - s += "%s} catch (const std::exception& e) {\n" % (t) - s += "#ifdef DEBUG\n" - s += "%s std::cerr << e.what() << std::endl;\n" % (t) - s += "#endif\n" - s += "%s return tensileStatusFailure;\n" % (t) - s += "%s}\n" % (t) - if not globalParameters["PreciseKernelTime"] or kernelLanguage == "Source": - s += "%sif( outputEvent != NULL )\n" % (t) - s += "%s hipEventRecord(outputEvent[enqueueIdx], stream );\n" % (t) - s += " }\n" - t = t[2:] - - - ################################################### - # Enqueue Kernel for Global Accumultation Buffer - ################################################### - if solution["_GlobalAccumulation"]: - for ko in solution.getKernelConversionObjects(): - kernelName = ko.getKernelName() - s += "%s// enqueue GSU third kernel\n" % (t) - - # grid sizes - s += "%ssize_t localWorkSizeGlobalAccum[3] = { 256, 1, 1};\n" % (t) - s += "%ssize_t globalWorkSizeGlobalAccum[3] = { 1, 1, 1};\n" % (t) - s 
+= "%sglobalWorkSizeGlobalAccum[0] = (sizeOfC + localWorkSizeGlobalAccum[0] - 1) / localWorkSizeGlobalAccum[0];\n" % (t) - s += "%s// b/c single kernel, add extra work-group here if edge needed\n" % (t) - - s += "%stry {\n" % (t) - t += " " - # TODO - timing with beta kernels is somewhat pessimistic since it has this separate event only on the GSU path. - # Introduces 2-3us of overhead ; may want to disable PreciseKernelTime so non-GSU have same overhead. - # Long-term fix would be to launch the beta kernel with the hipHccModule* API and set start-event in that call - s += "%skernelsLaunched++;\n" % (t) - s += "%shipLaunchKernelGGL(\n" % (t) - t += " " - s += "%sHIP_KERNEL_NAME(%s),\n" % (t, kernelName) - s += "%sdim3(globalWorkSizeGlobalAccum[0], globalWorkSizeGlobalAccum[1], globalWorkSizeGlobalAccum[2]),\n" % (t) - s += "%sdim3(localWorkSizeGlobalAccum[0], localWorkSizeGlobalAccum[1], localWorkSizeGlobalAccum[2]),\n" % (t) - s += "%s0, // groupMemBytes\n" % (t) - s += "%sstream,\n" % (t) - s += "%sdataD,\n" % (t) - s += "%sworkspace,\n" % (t) - s += "%sdataC,\n" % (t) - s += "%s%s,\n" % (t, "alpha" if kernel["_GlobalAccumulation"] == 'MultipleBuffer' else "1") - s += "%s%s,\n" % (t, "beta" if (kernel["_GlobalAccumulation"] == 'MultipleBuffer' and problemType["UseBeta"]) else "0") - # strides - for i in range(0, numStridesC): - s += "%s%s,\n" % (t, self.strideList[i]) - for i in range(0, numStridesC): - s += "%s%s,\n" % (t, WSstrides[i]) - for i in range(numStridesC, numStridesC*2): - s += "%s%s,\n" % (t, self.strideList[i]) - # sizes - for i in range(0, problemType["NumIndicesC"]): - s += "%ssize%s%s" % (t, self.indexChars[i], ",\n") - s += "%s%u);\n" % (t, (solution["GlobalSplitU"] if kernel["_GlobalAccumulation"] == 'MultipleBuffer' else 1)) - t = t[:-2] - s += "%sif( outputEvent != NULL )\n" % (t) - s += "%s hipEventRecord(outputEvent[0], stream );\n" % (t) - t = t[:-2] - s += "%s} catch (const std::exception& e) {\n" % (t) - s += "#ifdef DEBUG\n" - s += "%s 
std::cerr << e.what() << std::endl;\n" % (t) - s += "#endif\n" - s += "%s return tensileStatusFailure;\n" % (t) - s += "%s}\n" % (t) - - s += "\n" - s += " return tensileStatusSuccess;\n" - s += "}\n" - s += "\n" - s += "/* Solution Parameters\n" - s += Solution.getParametersIndented(solution.getAttributes(), " ") - s += "*/\n" - s += "\n" - - return s - - - ############################################################################## - # getHeaderString - ############################################################################## - def getHeaderString(self, solution): - s = "" - if not globalParameters["MergeFiles"] or globalParameters["NumMergedFiles"] > 1: - s += "#pragma once\n\n" - s += "#include \"TensileTypes.h\"\n" - s += "#include \"SolutionHelper.h\"\n" - s += "#include \"Tools.h\"\n" - s += "\n" - - # include kernels - for kernel in solution.getKernels(): - if kernel != None: - kernelName = self.kernelWriter.getKernelName(kernel) - s += "#include \"" + kernelName + ".h\"\n" - for ko in solution.getHelperKernelObjects(): - kernelName = ko.getKernelName() - s += "#include \"" + kernelName + ".h\"\n" - - s += "\n" - - # function declaration - s += self.getSolutionSignature(solution, header=True) + ";\n" - s += "\n" - #s += "#endif\n" - s += "\n" - return s - - ######################################## - # get solution arguments - # includeData adds launch-time info including data pointers and solution index - def getArgList(self, problemType, includeSolutionInfo, includeData, includeEvents, includeStream, includeGlobalAccumBuffer=False, GlobalAccumKernel=False): - self.strideList = [] - self.sizeList = [] - argList = [] - - if includeSolutionInfo: - argList.append(("SolutionLock *", "solutionLock", "nullptr")) - # argList.append(("const char *", "kernelName2")) - # argList.append(("const unsigned char *", "kernelCoba")) - - # data ptrs - if includeData: - typeName = problemType["DataType"].toCpp() - destTypeName = problemType["DestDataType"].toCpp() - 
computeTypeName = problemType["ComputeDataType"].toCpp() - if self.language == "HIP": - if GlobalAccumKernel: - argList.append(("float *", "dataD", "nullptr")) - argList.append(("const float *", "dataC", "nullptr")) - else: - argList.append(("%s *"%destTypeName, "dataD", "nullptr")) - argList.append(("const %s *"%destTypeName, "dataC", "nullptr")) - argList.append(("const %s *"%typeName, "dataA", "nullptr")) - argList.append(("const %s *"%typeName, "dataB", "nullptr")) - else: - argList.append(("cl_mem", "dataD", "nullptr")) - argList.append(("cl_mem", "dataC", "nullptr")) - argList.append(("cl_mem", "dataA", "nullptr")) - argList.append(("cl_mem", "dataB", "nullptr")) - argList.append((computeTypeName, "alpha", "%s()"%computeTypeName)) - if problemType["UseBeta"]: - argList.append((computeTypeName, "beta", "%s()"%computeTypeName)) - - # initial strides ? - firstStrideAB = firstStrideCD = 1 - if problemType["UseInitialStridesAB"]: - firstStrideAB = 0 - if problemType["UseInitialStridesCD"]: - firstStrideCD = 0 - lastStrideC = problemType["NumIndicesC"] - lastStrideA = len(problemType["IndexAssignmentsA"]) - lastStrideB = len(problemType["IndexAssignmentsB"]) - # d strides - for i in range(firstStrideCD,lastStrideC): - self.strideList.append("strideD%u%s" % (i, self.indexChars[i])) - # c strides - for i in range(firstStrideCD,lastStrideC): - self.strideList.append("strideC%u%s" % (i, self.indexChars[i])) - # a strides - for i in range(firstStrideAB,lastStrideA): - self.strideList.append("strideA%u%s" % (i, \ - self.indexChars[problemType["IndexAssignmentsA"][i]])) - # b strides - for i in range(firstStrideAB,lastStrideB): - self.strideList.append("strideB%u%s" % (i, \ - self.indexChars[problemType["IndexAssignmentsB"][i]])) - # c sizes - for i in range(0,problemType["TotalIndices"]): - self.sizeList.append("size%s" % self.indexChars[i]) - for stride in self.strideList: - argList.append(("unsigned int", stride, 0)) - for size in self.sizeList: - 
argList.append(("unsigned int", size, 0)) - if includeStream: - argList.append((self.streamName, "stream", "nullptr")) - if includeEvents: - argList.append(("unsigned int", "numInputEvents", 0)) - argList.append(("%s *"%self.eventName, "inputEvents", "nullptr")) - argList.append(("%s *"%self.eventName, "outputEvent", "nullptr")) - - if includeData: - if self.language == "HIP": - if includeGlobalAccumBuffer: - argList.append(("float *", "workspace", "nullptr")) - - return argList - - ######################################## - # get function signature - def getSolutionSignature(self, solution, header=False): - t = "" # indent - s = "" - solutionName = self.getSolutionName(solution) - s += "%s%s %s(\n" % (t, self.statusName, solutionName) - t += " " - argList = self.getArgList(solution["ProblemType"], True, True, True, True, True) - for i in range(0, len(argList)): - argString = "%s %s = %s" % argList[i] if header else "%s %s" % (argList[i][0], argList[i][1]) - s += "%s%s%s" % (t, argString, ",\n" if i < len(argList)-1 else ")" ) - return s - - ######################################## - # get full header code - # called from BenchmarkProblems - def getHeaderFileString(self, solution): - fileStr = "" # CHeader - fileStr += self.getHeaderString(solution) - return fileStr - - diff --git a/Tensile/TensileCreateLibrary.py b/Tensile/TensileCreateLibrary.py index dae1d0502..f28ba3119 100644 --- a/Tensile/TensileCreateLibrary.py +++ b/Tensile/TensileCreateLibrary.py @@ -39,7 +39,6 @@ from .KernelWriterSource import KernelWriterSource from .SolutionLibrary import MasterSolutionLibrary from .SolutionStructs import Solution -from .SolutionWriter import SolutionWriter import argparse import collections @@ -480,8 +479,8 @@ def buildKernelSourceAndHeaderFiles(results, outputPath, kernelsWithBuildErrs): ################################################################################ # Write Solutions and Kernels for BenchmarkClient or LibraryClient 
################################################################################ -def writeSolutionsAndKernels(outputPath, CxxCompiler, problemTypes, solutions, kernels, kernelHelperObjs, \ - solutionWriter, kernelWriterSource, kernelWriterAssembly, errorTolerant=False): +def writeKernels(outputPath, CxxCompiler, problemTypes, solutions, kernels, kernelHelperObjs, \ + kernelWriterSource, kernelWriterAssembly, errorTolerant=False): start = time.time() codeObjectFiles = [] @@ -625,19 +624,17 @@ def success(kernel): ############################################################################## # Min Naming / Solution and Kernel Writers ############################################################################## -def getSolutionAndKernelWriters(solutions, kernels): +def getKernelWriters(solutions, kernels): # if any kernels are assembly, append every ISA supported - solutionSerialNaming = Solution.getSerialNaming(solutions) kernelSerialNaming = Solution.getSerialNaming(kernels) solutionMinNaming = Solution.getMinNaming(solutions) kernelMinNaming = Solution.getMinNaming(kernels) - solutionWriter = SolutionWriter(solutionMinNaming, solutionSerialNaming, kernelMinNaming, kernelSerialNaming) kernelWriterSource = KernelWriterSource(kernelMinNaming, kernelSerialNaming) kernelWriterAssembly = KernelWriterAssembly(kernelMinNaming, kernelSerialNaming) - return (solutionWriter, kernelWriterSource, kernelWriterAssembly, kernelMinNaming, solutionMinNaming) + return (kernelWriterSource, kernelWriterAssembly, kernelMinNaming, solutionMinNaming) ################################################################################ # copy static cpp files and headers @@ -659,7 +656,7 @@ def copyStaticFiles(outputPath=None): return libraryStaticFiles -def buildObjectFileNames(solutionWriter, kernelWriterSource, kernelWriterAssembly, solutions, kernels, kernelHelperObjs): +def buildObjectFileNames(kernelWriterSource, kernelWriterAssembly, solutions, kernels, kernelHelperObjs): # Build lists 
of output object names sourceKernelNames = [] @@ -975,14 +972,14 @@ def writeBenchmarkClientFiles(libraryWorkingPath, tensileSourcePath, solutions, copyStaticFiles(libraryWorkingPath) kernels, kernelsBetaOnly, _ = generateKernelObjectsFromSolutions(solutions) - solutionWriter, kernelWriterSource, kernelWriterAssembly, \ - kernelMinNaming, _ = getSolutionAndKernelWriters(solutions, kernels) + kernelWriterSource, kernelWriterAssembly, \ + kernelMinNaming, _ = getKernelWriters(solutions, kernels) # write solution, kernels and CMake problemType = solutions[0]["ProblemType"] - codeObjectFiles = writeSolutionsAndKernels( \ + codeObjectFiles = writeKernels( \ libraryWorkingPath, cxxCompiler, [problemType], solutions, kernels, kernelsBetaOnly, \ - solutionWriter, kernelWriterSource, kernelWriterAssembly, errorTolerant=True ) + kernelWriterSource, kernelWriterAssembly, errorTolerant=True ) newLibraryDir = ensurePath(os.path.join(libraryWorkingPath, 'library')) newLibraryFile = os.path.join(newLibraryDir, "TensileLibrary.yaml") @@ -1180,8 +1177,8 @@ def splitExtraParameters(par): kernels, kernelHelperObjs, _ = generateKernelObjectsFromSolutions(solutions) # if any kernels are assembly, append every ISA supported - solutionWriter, kernelWriterSource, kernelWriterAssembly, \ - kernelMinNaming, _ = getSolutionAndKernelWriters(solutions, kernels) + kernelWriterSource, kernelWriterAssembly, \ + kernelMinNaming, _ = getKernelWriters(solutions, kernels) staticFiles = copyStaticFiles(outputPath) @@ -1190,7 +1187,7 @@ def splitExtraParameters(par): sourceKernelFiles, asmKernelFiles, sourceLibFiles, - asmLibFiles) = buildObjectFileNames(solutionWriter, kernelWriterSource, \ + asmLibFiles) = buildObjectFileNames(kernelWriterSource, \ kernelWriterAssembly, solutions, kernels, kernelHelperObjs) (_, @@ -1224,8 +1221,8 @@ def splitExtraParameters(par): outputPath ) # write solutions and kernels - codeObjectFiles = writeSolutionsAndKernels(outputPath, CxxCompiler, None, solutions, - 
kernels, kernelHelperObjs, solutionWriter, kernelWriterSource, kernelWriterAssembly) + codeObjectFiles = writeKernels(outputPath, CxxCompiler, None, solutions, + kernels, kernelHelperObjs, kernelWriterSource, kernelWriterAssembly) bothLibSet = set(sourceLibPaths + asmLibPaths) setA = set( map( os.path.normcase, set(codeObjectFiles) ) ) diff --git a/Tensile/Tests/unit/test_TensileCreateLibrary.py b/Tensile/Tests/unit/test_TensileCreateLibrary.py index 37d488df0..8e391402a 100644 --- a/Tensile/Tests/unit/test_TensileCreateLibrary.py +++ b/Tensile/Tests/unit/test_TensileCreateLibrary.py @@ -50,20 +50,8 @@ def test_loadSolutions(caplog, useGlobalParameters): assert len(kernels) == 3 - solutionWriter, _, kernelWriterAssembly, \ - _, _ = TensileCreateLibrary.getSolutionAndKernelWriters(solutions, kernels) - - expectedSolutionName0 = "Cijk_Ailk_Bljk_SB_MT128x128x2_SE_TT8_8_WG16_16_1" - expectedSolutionName1 = "Cijk_Ailk_Bljk_SB_MT64x64x2_SE_TT4_4_WG16_16_1" - expectedSolutionName2 = "Cijk_Ailk_Bljk_SB_MT64x64x2_SE_TT4_8_WG16_8_1" - - actualSolutionName0 = solutionWriter.getSolutionName(solutions[0]) - actualSolutionName1 = solutionWriter.getSolutionName(solutions[1]) - actualSolutionName2 = solutionWriter.getSolutionName(solutions[2]) - - assert expectedSolutionName0 == actualSolutionName0 - assert expectedSolutionName1 == actualSolutionName1 - assert expectedSolutionName2 == actualSolutionName2 + _, kernelWriterAssembly, \ + _, _ = TensileCreateLibrary.getKernelWriters(solutions, kernels) expectedKernelName0 = "Cijk_Ailk_Bljk_SB_MT128x128x2_SE_K1_TT8_8_WG16_16_1" expectedKernelName1 = "Cijk_Ailk_Bljk_SB_MT64x64x2_SE_K1_TT4_4_WG16_16_1" From 007986b61d576f1444a738bdb66cead26a2eb465 Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Thu, 14 Dec 2023 17:53:58 -0700 Subject: [PATCH 21/51] Remove WGM related kernargs if they are not needed (#1844) --- Tensile/Components/Signature.py | 7 ++++--- Tensile/KernelWriterAssembly.py | 11 +++++++---- 
Tensile/Source/lib/source/ContractionSolution.cpp | 9 ++++++--- 3 files changed, 17 insertions(+), 10 deletions(-) diff --git a/Tensile/Components/Signature.py b/Tensile/Components/Signature.py index 557835e2d..2a5ca9b28 100644 --- a/Tensile/Components/Signature.py +++ b/Tensile/Components/Signature.py @@ -293,9 +293,10 @@ def __call__(self, writer): kStr += self.addArgument("skExtraIters", '4', offset,"by_value", "u32"); offset += 4 # kStr += self.addArgument("dpTilesPerWG", '4', offset,"by_value", "u32"); offset += 4 - kStr += self.addArgument( "NumFullBlocks", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument( "WgmRemainder1", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument( "MagicNumberWgmRemainder1", '4', offset, "by_value", "u32"); offset += 4 + if abs(kernel["WorkGroupMapping"]) > 1: + kStr += self.addArgument( "NumFullBlocks", '4', offset, "by_value", "u32"); offset += 4 + kStr += self.addArgument( "WgmRemainder1", '4', offset, "by_value", "u32"); offset += 4 + kStr += self.addArgument( "MagicNumberWgmRemainder1", '4', offset, "by_value", "u32"); offset += 4 # for in-device stochastic rounding, iwe need to pass Seed # TODO: if kernel["ProblemType"]["StochasticRounding"] == 1: # in-device diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index 46b5608bf..8153375f3 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -1939,9 +1939,12 @@ def initKernel(self, kernel, tPA, tPB ): # Mostly impacts flat kernels and GSU edge since these need SGPR # for conditionals self.lastPostLoopSgpr = self.sgprPool.size() - self.defineSgpr("NumFullBlocks", 1) # Magic number to use for div by (NumWorkGroups1 % WGM) - self.defineSgpr("WgmRemainder1", 1) # Magic number to use for div by (NumWorkGroups1 % WGM) - self.defineSgpr("MagicNumberWgmRemainder1", 1) # Magic number to use for div by (NumWorkGroups1 % WGM) + self.numSgprWGM = 0 + if abs(kernel["WorkGroupMapping"]) > 1: 
+ self.numSgprWGM = 3 + self.defineSgpr("NumFullBlocks", 1) # Magic number to use for div by (NumWorkGroups1 % WGM) + self.defineSgpr("WgmRemainder1", 1) # Magic number to use for div by (NumWorkGroups1 % WGM) + self.defineSgpr("MagicNumberWgmRemainder1", 1) # Magic number to use for div by (NumWorkGroups1 % WGM) # SR only for F8 type if kernel["ProblemType"]["DataType"].is8bitFloat(): @@ -1972,7 +1975,7 @@ def initKernel(self, kernel, tPA, tPB ): 2 + \ pkArgumentToLoad + \ skArgumentToLoad + \ - 3 + \ + self.numSgprWGM + \ self.numSgprOffsetD + self.numSgprOffsetC + self.numSgprOffsetA + self.numSgprOffsetB # SR only for F8 type diff --git a/Tensile/Source/lib/source/ContractionSolution.cpp b/Tensile/Source/lib/source/ContractionSolution.cpp index 161d3eca7..aef694c6e 100644 --- a/Tensile/Source/lib/source/ContractionSolution.cpp +++ b/Tensile/Source/lib/source/ContractionSolution.cpp @@ -674,9 +674,12 @@ namespace Tensile magicNumberWgmRemainder1 = smallMagicNumber(wgmRemainder1); } - rv.args.append("numFullBlocks", numFullBlocks); - rv.args.append("wgmRemainder1", wgmRemainder1); - rv.args.append("magicNumberWgmRemainder1", magicNumberWgmRemainder1); + if(std::abs(sizeMapping.workGroupMapping) > 1) + { + rv.args.append("numFullBlocks", numFullBlocks); + rv.args.append("wgmRemainder1", wgmRemainder1); + rv.args.append("magicNumberWgmRemainder1", magicNumberWgmRemainder1); + } } if(problemType.stochasticRounding) From 670900eccbcf511728859814a56c3846e00597fb Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Fri, 15 Dec 2023 16:39:23 -0700 Subject: [PATCH 22/51] Test limiting CI threads for only gfx11 (#1849) --- .jenkins/common.groovy | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/.jenkins/common.groovy b/.jenkins/common.groovy index 96561b377..e24a645c4 100644 --- a/.jenkins/common.groovy +++ b/.jenkins/common.groovy @@ -35,6 +35,9 @@ def runCompileCommand(platform, project, jobName, boolean debug=false) // avoid bug causing long build times 
of certain files. String buildType = 'Release' // debug ? 'Debug' : 'RelWithDebInfo' String parallelJobs = "export HIPCC_COMPILE_FLAGS_APPEND='-O3 -Wno-format-nonliteral -parallel-jobs=4'" + String buildThreads = '-1' // if hipcc is used may be multiplied by parallel-jobs + if (platform.jenkinsLabel.contains('gfx11')) + buildThreads = '16' // comment @@ -62,7 +65,7 @@ def runCompileCommand(platform, project, jobName, boolean debug=false) pushd build export PATH=/opt/rocm/bin:\$PATH - cmake -DCMAKE_BUILD_TYPE=${buildType} -DCMAKE_CXX_COMPILER=${compiler} -DTensile_ROOT=\$(pwd)/../Tensile ../HostLibraryTests + cmake -DCMAKE_BUILD_TYPE=${buildType} -DCMAKE_CXX_COMPILER=${compiler} -DTensile_CPU_THREADS=${buildThreads} -DTensile_ROOT=\$(pwd)/../Tensile ../HostLibraryTests NPROC_BUILD=16 if [ `nproc` -lt 16 ] then From 6acff08cd300347b3ecf83e7804a2cf164aa3c26 Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Tue, 19 Dec 2023 09:05:33 -0700 Subject: [PATCH 23/51] Fix HostLibraryTests on gfx942 and gfx941 (#1851) --- .../aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml | 11947 ++++++++++ .../aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml | 11955 ++++++++++ .../aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml | 11955 ++++++++++ .../aquavanjaram941_Cijk_Alik_Bljk_SB.yaml | 12161 ++++++++++ .../aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml | 11947 ++++++++++ .../aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml | 11955 ++++++++++ .../aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml | 11955 ++++++++++ .../aquavanjaram942_Cijk_Alik_Bljk_SB.yaml | 12161 ++++++++++ .../aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml | 19425 ++++++++++++++++ .../aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml | 18412 +++++++++++++++ .../aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml | 19013 +++++++++++++++ .../aquavanjaram941_Cijk_Alik_Bljk_SB.yaml | 19239 +++++++++++++++ .../aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml | 19425 ++++++++++++++++ .../aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml | 18412 +++++++++++++++ .../aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml | 19013 +++++++++++++++ 
.../aquavanjaram942_Cijk_Alik_Bljk_SB.yaml | 19239 +++++++++++++++ .../aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml | 1379 ++ .../aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml | 1379 ++ .../aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml | 1379 ++ .../aquavanjaram941_Cijk_Alik_Bljk_SB.yaml | 1815 ++ .../aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml | 1379 ++ .../aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml | 1379 ++ .../aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml | 1379 ++ .../aquavanjaram942_Cijk_Alik_Bljk_SB.yaml | 1815 ++ 24 files changed, 260118 insertions(+) create mode 100644 HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml create mode 100644 
HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml create mode 100644 HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml create mode 100644 HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml create mode 100644 HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml create mode 100644 HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml create mode 100644 HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml diff --git a/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml b/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml new file mode 100644 index 000000000..0ea8131a6 --- /dev/null +++ b/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml @@ -0,0 +1,11947 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 
3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + 
LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: 
Cijk_Ailk_Bjlk_SB_MT64x32x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 128 + LSPA: 16 + LSPB: 8 + LVCA: 16 + LVCB: 32 + LVPA: 4 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + 
LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: 
Cijk_Ailk_Bjlk_SB_MT64x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 128 + LSPA: 8 + LSPB: 8 + LVCA: 32 + LVCB: 32 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + 
LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + 
ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + 
LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: 
[] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 64 + LSPA: 8 + LSPB: 16 + LVCA: 32 + LVCB: 16 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 2048 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + 
LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + 
ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 8 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + 
LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: 
true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x64x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 
128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + 
TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 
+ LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: 
false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 704 + - - 0 + - 2919.39 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1408 + - - 3 + - 3965.21 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 256 + - - 5 + - 3399.4 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1856 + - - 3 + - 3677.9 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 704 + - - 2 + - 4025.67 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1856 + - - 1 + - 4099.34 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 704 + - 128 + - - 5 + - 687.223 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 448 + - - 0 + - 3882.38 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1024 + - - 2 + - 2991.29 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 128 + - - 3 + - 3361.73 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 256 + - - 3 + - 3403.36 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 3584 + - - 4 + - 4166.96 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1856 + - - 5 + - 882.062 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 
1408 + - 128 + - - 5 + - 2048.56 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 6784 + - - 1 + - 4227.19 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 64 + - - 0 + - 2273.46 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 4 + - 6784 + - - 6 + - 194.253 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 5888 + - - 0 + - 3475.26 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 5056 + - - 4 + - 4213.88 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 448 + - - 0 + - 4202.37 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1856 + - - 2 + - 4153.36 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 2368 + - - 0 + - 3619.5 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 6784 + - - 3 + - 3128.03 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 4 + - - 6 + - 149.186 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 128 + - - 0 + - 2511.61 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1408 + - - 6 + - 39.7262 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1856 + - - 5 + - 4017.34 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 4288 + - - 4 + - 4130.97 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 64 + - 5888 + - - 0 + - 1980.08 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 64 + - 64 + - - 5 + - 41.1402 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2944 + - - 3 + - 2489.92 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 3287.9 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 6784 + - - 1 + - 4140.0 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1024 + - - 5 + - 3273.89 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3470.26 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 448 + - - 5 + - 3790.78 + - - - 4 + - 3584 
+ - 1 + - 3328 + - 4 + - 4 + - 4 + - 3584 + - - 6 + - 128.44 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 1024 + - - 2 + - 3437.89 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1856 + - - 3 + - 4009.11 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 669.456 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 2944 + - - 2 + - 4215.74 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 2944 + - - 3 + - 3651.59 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 4 + - - 6 + - 161.666 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 6784 + - - 4 + - 4422.41 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 4 + - 1024 + - - 6 + - 38.4202 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1856 + - - 3 + - 3710.2 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 5888 + - - 6 + - 196.019 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 704 + - 64 + - - 5 + - 471.175 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 3584 + - - 4 + - 4043.78 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1024 + - - 5 + - 3721.51 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 5056 + - - 1 + - 4197.94 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 1408 + - - 3 + - 3770.16 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 128 + - - 5 + - 1559.53 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 4 + - - 6 + - 5.6044 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 4 + - 704 + - - 6 + - 21.193 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 64 + - - 5 + - 940.711 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 704 + - 6784 + - - 3 + - 3800.68 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 704 + - - 0 + - 525.528 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 4 + - - 6 + - 160.47 + - - 
- 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 4 + - 2944 + - - 6 + - 83.1375 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 3 + - 2502.66 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3773.07 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 6784 + - - 1 + - 4366.11 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 704 + - 4 + - - 6 + - 20.9987 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 4288 + - - 4 + - 4129.09 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 64 + - - 0 + - 333.558 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 64 + - - 5 + - 789.73 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 2944 + - - 1 + - 4258.3 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 128 + - - 3 + - 3066.76 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 704 + - 704 + - - 5 + - 2265.32 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1408 + - - 5 + - 4027.4 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 4288 + - - 0 + - 4095.44 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 2368 + - - 3 + - 4148.74 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 5056 + - - 4 + - 4267.51 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 5888 + - - 3 + - 3943.23 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 704 + - 704 + - - 5 + - 1764.42 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 256 + - 448 + - - 5 + - 1189.51 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 2368 + - - 5 + - 3576.62 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5056 + - - 3 + - 3022.54 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 2368 + - - 6 + - 86.8332 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1408 + - - 3 + - 4153.8 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 
+ - 2944 + - 3584 + - - 4 + - 4219.31 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 3584 + - - 5 + - 3646.0 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 2368 + - - 3 + - 4137.56 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1024 + - - 4 + - 3614.3 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 2368 + - - 3 + - 3987.25 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1856 + - - 5 + - 2304.16 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 64 + - - 0 + - 3547.32 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 4288 + - - 5 + - 2766.27 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 448 + - - 5 + - 334.09 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4 + - - 6 + - 8.75529 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 256 + - - 5 + - 2169.37 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 128 + - 448 + - - 0 + - 443.741 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 448 + - 2944 + - - 3 + - 3463.05 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 448 + - - 5 + - 4088.07 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 2944 + - - 1 + - 3992.62 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 704 + - 6784 + - - 3 + - 3982.47 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 64 + - 2944 + - - 5 + - 1284.11 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 5056 + - - 5 + - 2771.32 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1024 + - - 2 + - 3487.93 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3806.84 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 1925.42 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 2944 + - - 3 + - 3911.12 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 448 + - - 3 + - 
3083.38 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 704 + - - 3 + - 3828.1 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 704 + - - 0 + - 3364.48 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 2368 + - - 3 + - 3930.02 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 448 + - - 0 + - 3522.83 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 448 + - 448 + - - 5 + - 1344.94 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 4288 + - - 1 + - 4182.27 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 5888 + - - 1 + - 4196.28 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 2944 + - - 0 + - 3188.23 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 448 + - - 3 + - 2522.12 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 8.91734 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 5056 + - - 4 + - 4422.36 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 1856 + - - 3 + - 3887.18 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 6784 + - - 0 + - 3903.22 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1408 + - - 3 + - 3687.66 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 5056 + - - 4 + - 4181.82 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 64 + - - 0 + - 2370.45 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 128 + - 2368 + - - 5 + - 1645.26 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 5888 + - - 2 + - 4314.85 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1856 + - - 0 + - 2409.83 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 64 + - - 5 + - 1433.88 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 128 + - 64 + - - 5 + - 63.5965 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 128 + - - 0 + - 191.553 + - - - 6784 + - 4 + - 1 + 
- 768 + - 6784 + - 6784 + - 6784 + - 4 + - - 6 + - 193.292 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 4 + - - 6 + - 11.4122 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 4288 + - - 3 + - 4153.91 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 128 + - - 6 + - 5.74574 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 6784 + - - 1 + - 4401.5 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 256 + - 2368 + - - 0 + - 2606.89 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 704 + - - 5 + - 3956.89 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 6784 + - - 1 + - 4362.62 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 448 + - - 3 + - 2147.97 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1024 + - - 3 + - 3002.64 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1856 + - - 3 + - 4045.93 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1024 + - - 2 + - 3822.18 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 6784 + - - 5 + - 4049.53 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1408 + - - 3 + - 4054.63 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 704 + - 4288 + - - 3 + - 3367.98 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 64 + - - 5 + - 1737.41 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 2944 + - - 0 + - 3102.42 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1856 + - - 3 + - 3245.54 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1856 + - - 6 + - 51.8408 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 0 + - 257.341 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 256 + - - 5 + - 199.222 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 4 + - - 6 + - 51.9996 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 704 + - 2368 + - - 3 + - 3029.67 
+ - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 5888 + - - 1 + - 4363.5 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 704 + - - 2 + - 3966.3 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3242.83 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 704 + - - 5 + - 2153.58 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 5888 + - - 2 + - 4119.9 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 2944 + - - 3 + - 3977.27 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 64 + - 704 + - - 5 + - 347.421 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 5056 + - - 5 + - 2791.61 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 4 + - - 6 + - 0.181457 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1024 + - - 6 + - 37.9774 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 3584 + - - 2 + - 4350.48 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 4 + - - 6 + - 137.692 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1024 + - - 0 + - 1341.28 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 3584 + - - 1 + - 4245.11 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 128 + - - 5 + - 1799.74 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 128 + - 5888 + - - 3 + - 2935.41 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 64 + - 448 + - - 0 + - 223.673 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 64 + - - 5 + - 680.013 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 4 + - - 6 + - 168.606 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 6784 + - - 0 + - 3658.8 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 6784 + - - 4 + - 4213.36 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 704 + - 4 + - - 6 + - 27.6418 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 4288 + - 
- 4 + - 4214.89 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 64 + - - 5 + - 490.142 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 4 + - - 6 + - 99.326 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 64 + - - 5 + - 1537.3 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 128 + - - 5 + - 2278.34 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 704 + - 448 + - - 5 + - 1704.64 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 128 + - - 5 + - 95.7 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 2944 + - - 1 + - 3968.33 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 4288 + - - 5 + - 2277.51 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2368 + - - 3 + - 2056.4 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 5888 + - - 3 + - 4018.88 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 5 + - 859.223 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 256 + - 4 + - - 6 + - 10.6206 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 64 + - - 0 + - 3712.23 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 2368 + - - 3 + - 4076.08 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 5056 + - - 1 + - 4312.58 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 3584 + - - 4 + - 3394.7 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 5888 + - - 4 + - 4311.26 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 5888 + - - 3 + - 4107.54 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1024 + - - 6 + - 28.4982 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 5056 + - - 4 + - 4136.75 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 2944 + - - 0 + - 3243.99 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 448 + - - 0 + - 2389.52 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 
64 + - 64 + - 4288 + - - 5 + - 2038.08 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 5 + - 1920.05 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 256 + - 2944 + - - 3 + - 2934.06 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 2368 + - - 5 + - 4108.74 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1024 + - - 5 + - 791.749 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 448 + - - 3 + - 3360.26 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 2368 + - - 6 + - 84.147 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 128 + - 5056 + - - 3 + - 2191.32 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 704 + - 3584 + - - 0 + - 3426.21 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 2680.25 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1408 + - - 3 + - 3673.83 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 4 + - - 6 + - 166.453 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1408 + - - 3 + - 2373.74 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1856 + - - 2 + - 3912.6 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 256 + - 128 + - - 5 + - 343.771 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1408 + - - 5 + - 3792.27 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 448 + - - 6 + - 19.7668 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 6784 + - - 0 + - 3783.6 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 2944 + - - 5 + - 2129.29 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 5056 + - - 3 + - 4049.81 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 198.595 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 448 + - 6784 + - - 3 + - 3388.94 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 1024 + - - 4 + - 3246.95 + - - - 2944 + - 
704 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 704 + - - 5 + - 3735.54 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1856 + - - 3 + - 3963.13 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 5888 + - - 4 + - 4253.42 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 704 + - - 3 + - 3642.9 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1856 + - - 3 + - 3856.09 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1408 + - - 3 + - 3868.6 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1408 + - - 5 + - 939.01 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 256 + - - 5 + - 1945.21 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 704 + - 3584 + - - 1 + - 3165.88 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3584 + - - 0 + - 3983.17 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 4288 + - - 0 + - 3524.27 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 2944 + - - 1 + - 4222.0 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 704 + - - 5 + - 546.677 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 2368 + - - 0 + - 2868.13 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 64 + - - 5 + - 2751.86 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 2368 + - - 1 + - 4161.93 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 6784 + - - 1 + - 4400.04 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 704 + - 2944 + - - 0 + - 3535.95 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1024 + - - 2 + - 4106.69 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 4 + - - 6 + - 82.772 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1408 + - - 0 + - 2654.29 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 448 + - - 3 + - 3379.49 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 
+ - 448 + - 2368 + - - 3 + - 2521.25 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 2944 + - - 1 + - 4177.8 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 5056 + - - 6 + - 167.599 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 5888 + - - 1 + - 4228.5 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 4288 + - - 1 + - 4214.57 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1408 + - - 5 + - 2539.01 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1024 + - - 5 + - 3901.52 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 128 + - 6784 + - - 3 + - 3354.88 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 11.4137 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 448 + - - 3 + - 2765.1 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3584 + - - 0 + - 3690.82 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1408 + - - 1 + - 4184.21 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1408 + - - 0 + - 3108.57 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 6784 + - - 1 + - 3976.58 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 64 + - - 5 + - 1488.62 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 2944 + - - 1 + - 4125.34 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1024 + - - 3 + - 2724.02 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 5056 + - - 1 + - 4242.95 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 704 + - - 5 + - 4001.2 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 4 + - 4288 + - - 6 + - 118.631 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 704 + - - 5 + - 3209.86 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 2944 + - - 1 + - 4245.93 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 1408 + - - 3 + - 3968.21 
+ - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 128 + - - 0 + - 1640.81 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 4288 + - - 3 + - 3969.99 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 5888 + - - 3 + - 4128.28 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1856 + - - 3 + - 3365.97 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 64 + - 64 + - - 5 + - 28.656 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 6784 + - - 1 + - 4301.03 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 764.961 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 1408 + - - 3 + - 3358.94 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 4288 + - - 4 + - 4356.44 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 128 + - 3584 + - - 0 + - 2296.4 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 64 + - 5888 + - - 0 + - 2748.52 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 256 + - 5056 + - - 3 + - 3403.11 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 2944 + - - 3 + - 3271.25 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 128 + - - 5 + - 3106.07 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 2368 + - - 1 + - 4199.88 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 704 + - - 3 + - 3064.95 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 448 + - 6784 + - - 5 + - 3669.47 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 704 + - - 5 + - 1091.74 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 3 + - 3108.32 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3584 + - - 4 + - 4114.57 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 448 + - 704 + - - 5 + - 1710.41 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1856 + - - 1 + - 4048.53 + - - - 3584 + - 4288 + - 1 
+ - 3328 + - 3584 + - 3584 + - 3584 + - 4288 + - - 2 + - 4375.13 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1856 + - - 3 + - 3056.89 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 3584 + - - 1 + - 4078.37 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3584 + - - 2 + - 4385.26 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 5888 + - - 1 + - 4266.21 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1408 + - - 3 + - 2981.34 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 256 + - - 3 + - 2384.76 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 448 + - - 0 + - 3719.08 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 704 + - - 3 + - 2370.78 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 5056 + - - 2 + - 4030.12 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3144.93 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 2368 + - - 3 + - 4014.13 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 3182.26 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 2944 + - - 6 + - 102.866 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 2944 + - - 3 + - 3928.88 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 5888 + - - 4 + - 4298.98 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 128 + - 5056 + - - 5 + - 2552.59 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 6784 + - - 0 + - 3555.36 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3584 + - - 1 + - 4062.15 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 442.314 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 5888 + - - 3 + - 4167.2 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 2368 + - - 3 + - 4072.45 + - - - 128 + - 448 + - 1 + - 768 + - 
128 + - 128 + - 128 + - 448 + - - 5 + - 601.425 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3584 + - - 0 + - 3903.22 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3584 + - - 4 + - 4363.34 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 5056 + - - 3 + - 3876.46 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 4288 + - - 3 + - 4142.95 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 448 + - - 5 + - 3515.64 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1024 + - - 0 + - 1410.17 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1856 + - - 5 + - 4201.36 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 704 + - 2944 + - - 3 + - 3102.86 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 448 + - - 0 + - 3897.55 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 448 + - - 3 + - 2916.8 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 2368 + - - 0 + - 3313.33 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 2368 + - - 0 + - 4127.77 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 5056 + - - 5 + - 2677.48 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3584 + - - 4 + - 4106.38 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3584 + - - 5 + - 3759.1 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1408 + - - 3 + - 3889.9 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2766.18 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 1024 + - - 4 + - 3392.31 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 704 + - - 5 + - 3652.11 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1856 + - - 2 + - 4114.36 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 5888 + - - 0 + - 3931.65 + - - - 2368 + - 3584 + - 1 + - 1792 + - 
2368 + - 2368 + - 2368 + - 3584 + - - 4 + - 4088.58 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 6784 + - - 1 + - 4264.6 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 64 + - - 5 + - 2393.97 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 128 + - - 6 + - 5.77385 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2702.46 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 64 + - - 5 + - 3232.71 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 4288 + - - 3 + - 4016.92 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 1795.26 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1408 + - - 3 + - 3651.26 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 256 + - - 5 + - 397.985 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 256 + - - 3 + - 2923.86 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 1856 + - - 3 + - 4140.71 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 5056 + - - 4 + - 4087.73 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 2944 + - - 1 + - 4108.79 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 2944 + - - 1 + - 4161.96 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 704 + - - 0 + - 2531.6 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 704 + - 5888 + - - 3 + - 3650.25 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 128 + - - 5 + - 1248.85 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 10.7814 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 64 + - - 5 + - 1091.32 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 448 + - - 0 + - 2731.77 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1408 + - - 5 + - 2705.09 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 704 + - - 5 + - 
3644.53 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 448 + - - 3 + - 3441.81 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 3584 + - - 4 + - 4355.7 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 4288 + - - 5 + - 2678.95 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1856 + - - 3 + - 3687.53 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 4288 + - - 3 + - 3997.74 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 448 + - 4 + - - 6 + - 18.2225 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 256 + - 704 + - - 5 + - 1796.63 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1856 + - - 3 + - 3852.39 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1856 + - - 2 + - 3722.71 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 128 + - 128 + - - 5 + - 122.06 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 2368 + - - 3 + - 3684.15 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 2368 + - - 3 + - 3991.39 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 64 + - 704 + - - 0 + - 471.278 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3445.52 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 64 + - 2368 + - - 5 + - 1080.91 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 64 + - - 5 + - 1284.84 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 256 + - 4288 + - - 0 + - 3173.46 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 4 + - - 6 + - 37.2204 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 256 + - 6784 + - - 0 + - 3457.62 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 4 + - 128 + - - 6 + - 5.43 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 2368 + - - 5 + - 2514.34 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 2944 + - - 1 + - 4276.42 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 
+ - 128 + - 3584 + - - 0 + - 3274.21 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1024 + - - 0 + - 760.575 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 448 + - - 0 + - 3564.22 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 64 + - - 5 + - 546.018 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 128 + - - 5 + - 3248.47 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 4 + - 5056 + - - 6 + - 154.793 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1408 + - - 3 + - 3298.29 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 3584 + - - 3 + - 2785.95 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1024 + - - 3 + - 3645.14 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 64 + - - 0 + - 95.9735 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 2944 + - - 1 + - 4141.45 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 5056 + - - 3 + - 3888.62 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 128 + - - 5 + - 1337.19 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 2368 + - - 3 + - 3801.51 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 6784 + - - 1 + - 4377.32 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 4 + - - 6 + - 127.696 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 4 + - - 6 + - 142.208 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 3584 + - - 4 + - 4241.77 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 6784 + - - 6 + - 219.994 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 256 + - - 5 + - 2978.48 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 2368 + - - 3 + - 4103.33 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 448 + - - 0 + - 3374.02 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 448 + - 64 + - - 5 + - 216.495 + - - - 
704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 704 + - 1408 + - - 0 + - 2915.64 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 4 + - 3584 + - - 6 + - 100.063 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 64 + - - 5 + - 1089.32 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 3584 + - - 2 + - 4118.68 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 448 + - 3584 + - - 3 + - 2729.9 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 448 + - - 0 + - 3101.32 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 64 + - - 5 + - 2207.16 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 256 + - - 5 + - 382.64 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 6784 + - - 0 + - 4087.13 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3975.75 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 3 + - 2598.69 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 64 + - - 6 + - 2.85864 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 3584 + - - 1 + - 4014.94 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 2368 + - - 1 + - 3977.02 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 6784 + - - 3 + - 3942.58 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 448 + - 256 + - - 5 + - 1189.59 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 4 + - - 6 + - 2.78307 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 704 + - 128 + - - 5 + - 941.598 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 2944 + - - 1 + - 3872.53 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1856 + - - 0 + - 3874.81 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1024 + - - 4 + - 3603.09 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 448 + - 5888 + - - 3 + - 3386.81 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 704 + 
- - 5 + - 2726.63 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 3584 + - - 1 + - 4275.11 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 448 + - - 3 + - 3259.95 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1024 + - - 2 + - 3951.87 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 4288 + - - 4 + - 4366.67 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1856 + - - 5 + - 1434.07 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 704 + - - 5 + - 3703.12 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 6784 + - - 1 + - 4221.55 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 2944 + - - 3 + - 3693.09 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1024 + - - 3 + - 3436.38 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1856 + - - 4 + - 4077.22 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 256 + - 5888 + - - 0 + - 3239.3 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1024 + - - 0 + - 2263.62 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 64 + - 3584 + - - 0 + - 2182.38 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 5 + - 1413.49 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 128 + - - 3 + - 2853.3 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 64 + - - 5 + - 683.208 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 128 + - 4 + - - 6 + - 4.35437 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 2368 + - - 5 + - 1733.62 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1856 + - - 5 + - 2819.97 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 4288 + - - 3 + - 3793.18 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 5056 + - - 2 + - 3965.06 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 256 + - - 5 + - 1331.51 + - - - 5056 + - 
64 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 64 + - - 0 + - 2676.56 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 2944 + - - 0 + - 3290.5 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 3584 + - - 5 + - 3684.08 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 448 + - - 5 + - 3666.83 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 2944 + - - 5 + - 2247.73 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 5056 + - - 3 + - 4085.38 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 4 + - 2944 + - - 6 + - 97.1723 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 170.47 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 5056 + - - 3 + - 3750.12 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 2944 + - - 0 + - 3852.27 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 1024 + - - 4 + - 3334.32 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 1408 + - - 3 + - 3909.9 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 448 + - 448 + - - 5 + - 1975.49 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 6784 + - - 1 + - 4175.26 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3584 + - - 1 + - 4286.17 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 128 + - - 5 + - 2618.29 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 704 + - 5056 + - - 3 + - 3504.31 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1024 + - - 3 + - 3489.25 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 2944 + - - 1 + - 4288.48 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 4 + - 5888 + - - 6 + - 149.024 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 128 + - 2944 + - - 5 + - 2762.93 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 5888 + - - 2 + - 4388.07 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 
5888 + - 2944 + - - 1 + - 4258.33 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1856 + - - 5 + - 4067.08 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 448 + - 704 + - - 5 + - 2343.84 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1024 + - - 3 + - 2882.96 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 4 + - 4 + - - 6 + - 0.167285 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 128 + - - 0 + - 252.345 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 4288 + - - 2 + - 4329.74 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 3 + - 2043.4 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 3584 + - - 4 + - 4209.22 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1408 + - - 6 + - 52.9228 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 64 + - - 5 + - 759.656 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1408 + - - 3 + - 3952.8 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 5888 + - - 0 + - 3095.14 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 5888 + - - 3 + - 3892.37 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1408 + - - 0 + - 1918.56 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 3584 + - - 4 + - 4011.18 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1408 + - - 3 + - 3842.39 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 4288 + - - 0 + - 3819.09 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 5056 + - - 3 + - 4012.01 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 64 + - 4 + - - 6 + - 2.18921 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1024 + - - 4 + - 3673.03 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 64 + - - 5 + - 2706.1 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 5056 + - - 3 + - 4009.41 + - - - 1856 + - 
1024 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 1024 + - - 3 + - 3090.74 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 3584 + - - 4 + - 4087.91 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 256 + - - 5 + - 3866.84 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 64 + - - 5 + - 1860.78 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 4288 + - - 4 + - 4328.08 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 5056 + - - 4 + - 4099.19 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 5888 + - - 1 + - 4197.38 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 6784 + - - 1 + - 4198.1 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1024 + - - 3 + - 2847.6 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 5888 + - - 3 + - 4142.4 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 6784 + - - 0 + - 3996.33 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 4288 + - - 3 + - 3914.84 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 6784 + - - 1 + - 4250.91 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 4 + - - 6 + - 132.309 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 64 + - - 0 + - 2035.98 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 704 + - - 6 + - 26.4869 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1024 + - - 4 + - 3550.13 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 3584 + - - 4 + - 4319.25 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 2368 + - - 3 + - 3776.85 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3707.19 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1408 + - - 0 + - 1235.65 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1024 + - - 4 + - 3547.96 + - - - 1024 + - 2368 + 
- 1 + - 768 + - 1024 + - 1024 + - 1024 + - 2368 + - - 3 + - 3869.81 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 64 + - - 5 + - 3151.13 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 64 + - - 0 + - 525.454 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 704 + - - 0 + - 2456.3 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 4 + - - 6 + - 26.3506 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 4 + - - 6 + - 216.495 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 4 + - - 6 + - 100.881 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 1408 + - - 3 + - 4014.39 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 128 + - - 3 + - 3611.13 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 64 + - - 0 + - 99.7293 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 128 + - - 5 + - 3718.19 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 4288 + - - 4 + - 4293.61 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 3584 + - - 4 + - 4198.46 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1408 + - - 5 + - 3209.46 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3250.19 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 3584 + - - 1 + - 4044.21 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 4288 + - - 3 + - 4003.9 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 64 + - - 5 + - 1374.65 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 2368 + - - 1 + - 4211.22 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3837.98 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1408 + - - 1 + - 4180.09 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1856 + - - 5 + - 3818.01 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 
704 + - 704 + - 1856 + - - 3 + - 3440.88 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 3584 + - - 1 + - 4038.56 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 64 + - - 5 + - 1747.73 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 256 + - - 5 + - 2646.85 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 448 + - - 6 + - 18.4378 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 2944 + - - 3 + - 4010.93 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 5056 + - - 3 + - 4017.88 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 5056 + - - 1 + - 4207.49 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 128 + - 256 + - - 5 + - 343.822 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 2368 + - - 0 + - 3429.79 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 504.772 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 448 + - 2944 + - - 3 + - 3069.33 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 64 + - - 5 + - 46.7448 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 5056 + - - 3 + - 4102.31 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 128 + - 704 + - - 5 + - 686.57 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 5056 + - - 4 + - 4381.53 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 448 + - 64 + - - 5 + - 298.301 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2826.64 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 2944 + - - 3 + - 3838.04 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 2944 + - - 1 + - 4248.99 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 128 + - - 5 + - 1092.63 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 704 + - - 5 + - 3577.71 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1024 + - - 4 + - 3625.92 + - 
- - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1856 + - - 0 + - 4106.48 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 448 + - - 5 + - 696.217 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 448 + - - 5 + - 2815.38 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 2944 + - - 3 + - 3965.97 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3665.63 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 448 + - - 0 + - 2288.28 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 704 + - - 5 + - 2616.79 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3584 + - - 4 + - 4248.43 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 448 + - - 0 + - 1330.23 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 704 + - - 3 + - 3444.16 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 704 + - 2368 + - - 5 + - 3339.21 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 4 + - - 6 + - 104.423 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1024 + - - 0 + - 2173.33 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 4288 + - - 4 + - 4272.88 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 5888 + - - 3 + - 4047.97 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 4 + - 704 + - - 6 + - 27.9776 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 6784 + - - 0 + - 3814.9 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 5056 + - - 1 + - 4052.15 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 5888 + - - 4 + - 4400.94 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 5888 + - - 6 + - 189.146 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 5888 + - - 1 + - 4338.08 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 4288 + - - 1 + - 4320.35 + - - - 1856 + - 1856 + - 1 + - 256 
+ - 1856 + - 1856 + - 1856 + - 1856 + - - 3 + - 3415.85 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 3584 + - - 1 + - 4211.56 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 448 + - - 3 + - 3470.26 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 4288 + - - 3 + - 4113.36 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 5056 + - - 3 + - 4122.79 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1408 + - - 5 + - 3624.38 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 256 + - - 0 + - 191.101 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 128 + - 704 + - - 5 + - 940.712 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 448 + - - 0 + - 3860.84 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 64 + - 6784 + - - 0 + - 3144.95 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 448 + - - 5 + - 3850.58 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 448 + - - 0 + - 3858.56 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 704 + - - 5 + - 3711.98 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1856 + - - 4 + - 4106.89 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 704 + - - 5 + - 4074.94 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 2368 + - - 5 + - 2621.52 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2483.94 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 704 + - 5056 + - - 2 + - 3789.96 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 4 + - - 6 + - 36.9678 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 704 + - - 5 + - 1049.2 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 6784 + - - 6 + - 212.208 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 448 + - 5888 + - - 3 + - 3613.02 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 6784 + - 
- 0 + - 3717.66 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1408 + - - 5 + - 679.986 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1024 + - - 3 + - 3486.08 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 4288 + - - 4 + - 4312.4 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 704 + - 1024 + - - 3 + - 2795.61 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3559.29 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 5056 + - - 0 + - 3782.95 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 704 + - - 2 + - 3794.09 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 64 + - 448 + - - 5 + - 299.1 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1408 + - - 1 + - 3981.44 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 4288 + - - 0 + - 3447.47 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 2368 + - - 1 + - 4091.67 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1856 + - - 5 + - 3862.57 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1408 + - - 5 + - 2787.45 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 704 + - - 0 + - 3037.72 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 128 + - 128 + - - 5 + - 172.036 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 2944 + - - 3 + - 3805.83 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 4 + - - 6 + - 39.1339 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1856 + - - 6 + - 69.724 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 64 + - - 5 + - 2133.52 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 4 + - - 6 + - 66.0936 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 2368 + - - 3 + - 3855.84 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 704 + - - 3 + - 3804.97 + - - - 448 + - 1856 + - 1 + 
- 256 + - 448 + - 448 + - 448 + - 1856 + - - 3 + - 2752.33 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 2944 + - - 1 + - 4202.29 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 3584 + - - 2 + - 3543.21 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3584 + - - 0 + - 3528.38 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 3584 + - - 0 + - 3435.87 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 2368 + - - 3 + - 3965.76 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1024 + - - 5 + - 1575.26 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1024 + - - 0 + - 496.33 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 4288 + - - 5 + - 2371.5 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 704 + - - 3 + - 3035.65 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 4 + - 2368 + - - 6 + - 66.8813 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 5888 + - - 0 + - 3289.92 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 2944 + - - 2 + - 4250.44 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 5056 + - - 1 + - 4256.68 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 5888 + - - 5 + - 3876.51 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 3584 + - - 2 + - 4251.54 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 4 + - - 6 + - 67.2311 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 2368 + - - 5 + - 1820.1 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1856 + - - 3 + - 3828.99 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 4 + - - 6 + - 118.07 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 4 + - 128 + - - 6 + - 4.4929 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 128 + - - 5 + - 2665.48 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 4288 + - - 4 + - 
4324.92 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 4 + - - 6 + - 126.945 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 5056 + - - 1 + - 4245.26 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 4 + - - 6 + - 26.6986 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 6784 + - - 3 + - 3678.82 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 64 + - 3584 + - - 0 + - 1484.44 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 2368 + - - 3 + - 4141.21 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1024 + - - 3 + - 3301.25 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 128 + - - 3 + - 3543.23 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 5 + - 2388.63 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 256 + - - 5 + - 1387.47 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 4 + - - 6 + - 53.9165 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 2935.16 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 4288 + - - 3 + - 3851.88 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 4 + - 1856 + - - 6 + - 67.8511 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 64 + - - 5 + - 2243.33 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 0 + - 126.926 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 704 + - - 3 + - 3364.54 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1024 + - - 3 + - 2373.69 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 5056 + - - 4 + - 4413.13 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 64 + - 128 + - - 0 + - 85.7244 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 5888 + - - 1 + - 4286.35 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 4288 + - - 6 + - 142.313 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + 
- 1408 + - 1408 + - 2368 + - - 5 + - 4100.03 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 4288 + - - 6 + - 147.689 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1856 + - - 5 + - 1372.62 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 2368 + - - 5 + - 2700.41 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 64 + - 5056 + - - 5 + - 1749.11 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 448 + - 4 + - - 6 + - 14.6511 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 128 + - 4 + - - 6 + - 5.31222 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 4 + - 5056 + - - 6 + - 132.49 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 128 + - - 0 + - 99.6225 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1856 + - - 6 + - 67.8806 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 5056 + - - 0 + - 3677.35 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 5056 + - - 4 + - 4067.5 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 2944 + - - 1 + - 4114.77 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1024 + - - 3 + - 2363.6 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 4 + - 4 + - - 6 + - 0.132643 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 4 + - 2368 + - - 6 + - 80.2433 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1408 + - - 5 + - 3129.04 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 2368 + - - 1 + - 4027.48 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 5056 + - - 3 + - 3935.93 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 5056 + - - 1 + - 4326.23 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 2368 + - - 3 + - 4103.96 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 5888 + - - 4 + - 4318.6 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 2368 + - - 1 + - 4104.1 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 
4288 + - 4288 + - 1024 + - - 4 + - 3324.52 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 5056 + - - 4 + - 4222.28 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 448 + - - 5 + - 1387.06 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 6784 + - - 0 + - 3724.13 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 4 + - - 6 + - 210.45 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 6784 + - - 1 + - 4097.23 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 128 + - - 5 + - 2764.34 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1856 + - - 3 + - 3881.01 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 122.06 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 5888 + - - 5 + - 3782.58 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 4042.23 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 5888 + - - 1 + - 4317.1 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 4 + - 64 + - - 6 + - 2.70127 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 128 + - 4288 + - - 5 + - 1921.77 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1408 + - - 3 + - 3836.14 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 6784 + - - 1 + - 4388.59 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 5888 + - - 0 + - 3963.54 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 5888 + - - 0 + - 3239.97 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 64 + - - 0 + - 2790.18 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 5888 + - - 3 + - 3700.3 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1024 + - - 2 + - 3401.63 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1024 + - - 0 + - 1944.01 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1856 + - - 0 + - 1225.2 + - - - 
5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 4288 + - - 3 + - 4055.91 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 6784 + - - 1 + - 4409.39 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1408 + - - 3 + - 4118.01 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 4288 + - - 3 + - 4113.12 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 448 + - - 5 + - 2725.95 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1024 + - - 4 + - 3581.47 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1856 + - - 4 + - 4265.51 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 4 + - 64 + - - 6 + - 2.20612 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1408 + - - 0 + - 2152.47 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 5888 + - - 3 + - 3949.97 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 4288 + - - 3 + - 3776.65 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3584 + - - 0 + - 2703.7 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 2368 + - - 3 + - 3976.11 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 5056 + - - 2 + - 4200.55 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1408 + - - 3 + - 4043.67 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 5888 + - - 4 + - 4261.96 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 5888 + - - 3 + - 4092.65 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 704 + - - 5 + - 3815.54 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 448 + - - 0 + - 3430.22 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 256 + - - 5 + - 3108.26 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 128 + - 2944 + - - 0 + - 1985.29 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 5056 + - - 5 + - 2858.07 + - - - 3584 + - 4 
+ - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 4 + - - 6 + - 112.177 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 1238.66 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 2944 + - - 6 + - 106.164 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1024 + - - 2 + - 3925.16 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 2944 + - - 0 + - 3738.38 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 704 + - - 5 + - 3710.59 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 448 + - 4288 + - - 5 + - 3800.78 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 448 + - - 0 + - 3789.71 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 704 + - - 0 + - 3561.84 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 2944 + - - 5 + - 3909.2 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 4 + - - 6 + - 182.654 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 64 + - 4 + - - 6 + - 2.62659 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 6784 + - - 1 + - 4399.29 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 128 + - - 0 + - 382.627 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 128 + - - 5 + - 2158.21 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 2944 + - - 4 + - 4193.73 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 6784 + - - 1 + - 4273.81 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 704 + - - 5 + - 1238.83 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1408 + - - 3 + - 3906.13 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 5888 + - - 1 + - 4349.57 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 5888 + - - 0 + - 3569.22 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1856 + - - 4 + - 4095.42 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 
+ - 1024 + - 128 + - - 5 + - 948.368 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1408 + - - 5 + - 4093.9 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 448 + - - 5 + - 2518.46 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4288 + - - 3 + - 2591.66 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 4 + - - 6 + - 18.2679 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1856 + - - 0 + - 3509.68 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 448 + - 5056 + - - 3 + - 3644.56 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1856 + - - 3 + - 3310.94 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1408 + - - 6 + - 51.6418 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 64 + - - 5 + - 49.4489 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1856 + - - 5 + - 2664.59 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 6784 + - - 1 + - 4351.47 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 128 + - 6784 + - - 3 + - 2817.05 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 64 + - 5056 + - - 5 + - 2395.32 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1408 + - - 0 + - 3688.14 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 4 + - - 6 + - 94.74 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 4 + - 6784 + - - 6 + - 166.161 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 128 + - 64 + - - 5 + - 86.5101 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 448 + - - 0 + - 3628.55 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 704 + - - 0 + - 3535.45 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1408 + - - 1 + - 4141.53 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 704 + - - 5 + - 3661.36 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1024 + - - 4 + - 3607.26 + - - - 2944 + - 5888 + - 1 
+ - 1792 + - 2944 + - 2944 + - 2944 + - 5888 + - - 4 + - 4288.02 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 4288 + - - 1 + - 4204.24 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 2368 + - - 5 + - 4152.44 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 2944 + - - 0 + - 3627.43 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 4 + - - 6 + - 188.591 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 4 + - 4288 + - - 6 + - 132.797 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 3584 + - - 2 + - 3968.31 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 2944 + - - 0 + - 3632.22 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 4288 + - - 4 + - 4282.99 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 4 + - - 6 + - 0.183805 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1408 + - - 0 + - 2043.93 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1408 + - - 3 + - 3908.87 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1024 + - - 5 + - 2971.61 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2793.03 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 3584 + - - 0 + - 3726.19 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 4 + - 1408 + - - 6 + - 54.6578 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 704 + - - 5 + - 3816.87 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 704 + - 448 + - - 5 + - 2344.93 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 448 + - - 0 + - 3674.29 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 128 + - - 5 + - 1569.46 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 256 + - 3584 + - - 0 + - 3484.11 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 64 + - - 5 + - 347.676 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1856 + - - 
4 + - 4220.72 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1024 + - - 6 + - 37.5087 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 2944 + - - 1 + - 4297.39 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1856 + - - 1 + - 3871.56 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 4 + - 3584 + - - 6 + - 114.403 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1024 + - - 4 + - 3313.85 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 601.949 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 704 + - - 0 + - 3130.33 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 5056 + - - 6 + - 173.395 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 128 + - - 5 + - 1984.85 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 5056 + - - 4 + - 4116.81 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 5888 + - - 3 + - 4135.04 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1024 + - - 4 + - 3696.76 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1856 + - - 3 + - 3997.78 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 5056 + - - 2 + - 4053.86 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 686.243 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 1856 + - - 3 + - 4057.75 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 4288 + - - 3 + - 4109.55 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 4 + - - 6 + - 122.487 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 5888 + - - 3 + - 3991.21 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 128 + - - 5 + - 3906.41 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 2944 + - - 1 + - 4286.38 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 2368 + - - 3 + - 4145.31 + - - 
- 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1408 + - - 3 + - 3961.42 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 3 + - 3018.28 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 448 + - - 5 + - 347.743 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 5888 + - - 3 + - 3945.17 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 448 + - - 5 + - 2614.85 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 64 + - - 5 + - 1230.48 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1024 + - - 1 + - 3550.41 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1408 + - - 0 + - 2967.53 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1408 + - - 3 + - 4170.01 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 128 + - - 0 + - 2247.88 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 4288 + - - 4 + - 4346.55 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 448 + - 1408 + - - 3 + - 2123.86 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 696.352 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5888 + - - 3 + - 2749.88 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 448 + - - 0 + - 669.201 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 4 + - - 6 + - 52.2966 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 795.382 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 4 + - 448 + - - 6 + - 14.8561 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3584 + - - 2 + - 4172.03 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 4288 + - - 3 + - 3968.91 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 4 + - - 6 + - 36.9126 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 704 + - - 0 + - 2050.29 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 
+ - 5056 + - 704 + - - 3 + - 3498.86 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 4 + - 448 + - - 6 + - 18.5261 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 448 + - - 5 + - 861.912 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1408 + - - 5 + - 1045.36 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 704 + - - 6 + - 29.7186 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 6784 + - - 1 + - 4332.96 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 3 + - 2708.49 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 4 + - - 6 + - 66.6622 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 2944 + - - 0 + - 3742.3 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 64 + - - 5 + - 1491.88 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 6784 + - - 1 + - 4317.81 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 4 + - - 6 + - 11.2672 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 6784 + - - 1 + - 4111.36 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 704 + - - 3 + - 3985.35 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 64 + - - 5 + - 1046.04 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 4 + - - 7 + - 83.4965 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1024 + - - 4 + - 3399.45 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 3584 + - - 1 + - 3869.75 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 2368 + - - 3 + - 3919.78 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 704 + - - 3 + - 2251.05 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 128 + - - 5 + - 199.564 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 4288 + - - 0 + - 3788.4 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1856 + - - 0 + - 3742.99 + - - - 128 + - 2368 + - 1 
+ - 768 + - 128 + - 128 + - 128 + - 2368 + - - 5 + - 2251.59 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1856 + - - 0 + - 3686.3 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 64 + - - 0 + - 1818.98 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 64 + - 128 + - - 5 + - 59.2016 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 6784 + - - 4 + - 4172.14 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1024 + - - 2 + - 4165.04 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 2049.32 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 4 + - - 6 + - 19.5435 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 2368 + - - 3 + - 4015.31 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 1856 + - - 3 + - 3939.11 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1024 + - - 4 + - 2985.41 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 704 + - - 5 + - 2772.32 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 448 + - 4288 + - - 3 + - 3442.58 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1408 + - - 5 + - 1794.77 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 3584 + - - 1 + - 4084.55 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 4 + - - 6 + - 51.0511 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1408 + - - 0 + - 3398.36 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 5888 + - - 1 + - 4179.61 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1024 + - - 2 + - 3301.45 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 3584 + - - 1 + - 3823.13 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 448 + - - 5 + - 3743.66 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 5056 + - - 0 + - 3987.33 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 
2368 + - 2368 + - 5056 + - - 3 + - 3985.79 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 256 + - - 3 + - 3499.15 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1024 + - - 2 + - 3963.02 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 3584 + - - 0 + - 3843.44 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 704 + - 5888 + - - 3 + - 3834.02 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 6784 + - - 4 + - 4259.17 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 5056 + - - 3 + - 4112.46 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 4 + - - 6 + - 146.59 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 64 + - 2944 + - - 5 + - 1858.36 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 3584 + - - 1 + - 4114.91 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1024 + - - 3 + - 2943.69 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 5888 + - - 2 + - 4413.74 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 4 + - - 6 + - 83.8565 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 128 + - - 3 + - 2193.79 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 5056 + - - 1 + - 4255.61 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 4288 + - - 4 + - 4085.74 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 6784 + - - 1 + - 4350.26 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 4288 + - - 3 + - 3955.83 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1408 + - - 5 + - 3746.6 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 256 + - - 5 + - 2264.66 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 704 + - - 3 + - 3247.55 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 4288 + - - 0 + - 4212.78 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 
+ - 2368 + - 6784 + - - 3 + - 4072.95 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 5888 + - - 2 + - 4157.73 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 128 + - - 3 + - 2456.1 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 704 + - 64 + - - 5 + - 345.423 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1024 + - - 0 + - 954.555 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 4 + - 5888 + - - 6 + - 174.397 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 5888 + - - 5 + - 3187.19 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 2944 + - - 3 + - 3534.91 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 64 + - 256 + - - 5 + - 171.026 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 128 + - - 5 + - 1507.66 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1024 + - - 3 + - 3695.39 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 2157.43 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 2944 + - - 1 + - 4216.23 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 6784 + - - 1 + - 4359.85 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 128 + - - 0 + - 2817.72 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 2368 + - - 3 + - 4114.79 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1856 + - - 0 + - 3627.79 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 64 + - - 5 + - 3079.63 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 4 + - - 6 + - 69.1257 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 2944 + - - 5 + - 3779.01 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1856 + - - 5 + - 1554.43 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 6784 + - - 1 + - 4268.82 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 64 + - 4288 + - - 5 + - 1490.3 + - - 
- 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1856 + - - 1 + - 4017.69 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1408 + - - 3 + - 3682.75 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 448 + - - 3 + - 3386.34 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1408 + - - 3 + - 3195.56 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 704 + - - 0 + - 3140.55 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 4288 + - - 4 + - 4285.06 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 5056 + - - 1 + - 4273.65 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1856 + - - 5 + - 3711.26 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 4 + - - 6 + - 2.86579 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 2944 + - - 2 + - 4122.76 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 448 + - - 3 + - 3642.0 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 4288 + - - 3 + - 4043.21 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 704 + - - 0 + - 3785.63 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 4 + - - 6 + - 29.3126 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 3584 + - - 0 + - 2541.32 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 6784 + - - 1 + - 4239.29 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 5888 + - - 4 + - 4125.3 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 64 + - - 5 + - 2247.13 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 128 + - - 5 + - 1050.62 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 2944 + - - 3 + - 3832.33 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 128 + - - 5 + - 3255.81 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2543.53 + - - - 5056 + - 2368 + - 1 + - 
256 + - 5056 + - 5056 + - 5056 + - 2368 + - - 3 + - 3977.51 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 2368 + - - 3 + - 3470.98 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 4288 + - - 3 + - 4017.6 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1408 + - - 5 + - 3976.29 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 5888 + - - 1 + - 4280.99 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 2368 + - - 3 + - 4106.89 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 64 + - 2368 + - - 0 + - 1531.69 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 128 + - - 0 + - 398.133 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 6784 + - - 4 + - 4188.38 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1856 + - - 4 + - 4279.32 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 1856 + - - 3 + - 3845.33 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 2622.83 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 2368 + - - 5 + - 4199.02 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 64 + - - 5 + - 886.036 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 64 + - - 6 + - 2.94754 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 4288 + - - 4 + - 4241.8 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 6784 + - - 1 + - 4280.4 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1408 + - - 5 + - 1090.28 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1024 + - - 0 + - 1509.32 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 128 + - 5888 + - - 3 + - 2493.35 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 64 + - - 5 + - 2551.58 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1024 + - - 0 + - 682.324 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 
1024 + - 6784 + - - 3 + - 3896.62 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 448 + - 3584 + - - 5 + - 3216.81 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 5056 + - - 3 + - 4103.68 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 448 + - - 0 + - 3908.97 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1856 + - - 0 + - 3414.84 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 704 + - - 3 + - 4058.86 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 448 + - - 0 + - 3268.86 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1408 + - - 3 + - 4002.72 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 190.71 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 448 + - 5056 + - - 3 + - 3357.35 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 448 + - - 5 + - 3338.97 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 128 + - 4288 + - - 0 + - 2480.52 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 128 + - - 0 + - 2918.04 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 448 + - 1024 + - - 5 + - 2301.92 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 3584 + - - 5 + - 3747.36 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 448 + - - 0 + - 3978.56 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 3 + - 2843.69 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 704 + - 4288 + - - 5 + - 3650.35 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 6784 + - - 1 + - 4427.56 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 2944 + - - 5 + - 3950.8 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 128 + - - 5 + - 2305.25 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 5888 + - - 3 + - 4180.56 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 3584 + - - 6 + - 
123.765 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 448 + - 2368 + - - 0 + - 3094.47 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 64 + - - 5 + - 1975.32 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 704 + - - 3 + - 3103.64 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 11.594 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 5056 + - - 0 + - 3887.05 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 5056 + - - 3 + - 3991.07 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 64 + - 6784 + - - 0 + - 2242.84 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 6784 + - - 1 + - 4184.84 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 5888 + - - 4 + - 4389.36 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 2368 + - - 3 + - 3876.97 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 4288 + - - 1 + - 4226.88 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 5056 + - - 2 + - 4243.0 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 448 + - - 5 + - 2269.53 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 3584 + - - 1 + - 3876.57 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 1408 + - - 3 + - 3915.02 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 4 + - - 6 + - 5.69094 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 128 + - - 0 + - 3286.4 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1856 + - - 1 + - 4082.85 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 4 + - - 6 + - 79.0114 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 2368 + - - 3 + - 3926.34 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 2368 + - - 3 + - 4061.34 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 6784 + - - 2 + - 3967.47 +- null diff --git 
a/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml b/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml new file mode 100644 index 000000000..0f1b345d7 --- /dev/null +++ b/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml @@ -0,0 +1,11955 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + 
GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 8 + LSPA: 8 + LSPB: 64 + LVCA: 32 + LVCB: 4 + LVPA: 2 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + 
DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x64x8_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + 
GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 16 + LSPA: 8 + LSPB: 64 + LVCA: 32 + LVCB: 4 + LVPA: 2 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + 
ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + 
DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: 
+ AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + 
DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + 
PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x64x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + 
CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + 
PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + 
BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + 
PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + 
AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + 
PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + 
AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + 
PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - 
- 6 + - 85.8659 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 6 + - 126.0 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4131.48 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4428.58 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 4 + - 2372.29 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 702.051 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 2207.44 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4346.21 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 175.395 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 4 + - 2084.25 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 3531.52 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3987.08 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 4.47573 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 6 + - 160.867 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4148.65 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 3974.74 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 3529.36 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 11.3224 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 5 + - 3008.68 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4164.25 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1371.73 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 2639.09 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 116.897 + - - - 2944 + - 704 + - 1 + - 768 + - 
2944 + - 2944 + - 2944 + - 768 + - - 4 + - 3241.07 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 2 + - 2702.65 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 1 + - 3799.9 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4458.37 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 4 + - 3455.76 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 4155.22 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 4 + - 1796.4 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4428.83 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4082.8 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 0 + - 3944.77 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 18.26 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4419.18 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 2263.71 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 11.1269 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 973.122 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 0 + - 3521.12 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 7 + - 66.6068 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 4 + - 1399.93 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3551.99 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3999.21 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3965.86 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4140.72 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 
3463.37 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 599.676 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 6 + - 98.756 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4195.0 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4276.85 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 4 + - 3113.24 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 4 + - 2069.13 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4297.69 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4351.4 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4404.1 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 4 + - 2787.8 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 108.888 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4154.23 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 4 + - 3212.76 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 2 + - 2909.47 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3644.19 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 134.921 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 3294.38 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2967.8 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 3715.59 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 5 + - 3532.34 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4228.72 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 1644.0 + - - - 2368 + - 6784 + 
- 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 4111.2 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 2007.27 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 1839.47 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 17.7941 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4233.35 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 640.322 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 38.1032 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4339.85 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 133.74 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 5.31723 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 2846.54 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 3601.5 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 1 + - 4139.06 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 6 + - 112.043 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4209.45 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 545.16 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 7 + - 0.129381 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 171.592 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4380.51 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 83.6644 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 3807.05 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 3971.62 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 0 + - 3989.46 + - - - 4288 + - 
64 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 4 + - 1828.11 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 4 + - 2152.29 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4420.97 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 4 + - 3792.89 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 0 + - 4345.66 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 18.1234 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 1237.32 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 3870.81 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 2 + - 2177.8 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 3253.82 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 311.788 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 3358.09 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4173.86 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 4 + - 3135.3 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 299.14 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 4 + - 1771.61 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 617.859 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4499.41 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 0 + - 3912.61 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4491.07 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 3361.78 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 6 + - 86.4953 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + 
- 2368 + - 2368 + - 768 + - - 0 + - 3504.5 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 0 + - 3931.48 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 6 + - 83.6254 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 2 + - 3128.48 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 156.691 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4238.65 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 4376.43 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4330.46 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 2.5886 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4220.07 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 4 + - 3152.32 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 3465.0 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 4 + - 2224.62 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 2074.01 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 1193.48 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 3252.91 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 1844.0 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 237.342 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 4 + - 2442.01 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4162.27 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 342.225 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 4 + - 323.901 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 
3974.28 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 3420.33 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 66.3638 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 270.81 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 1308.95 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3960.37 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 3827.66 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 2 + - 2984.7 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 4045.85 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 2 + - 3159.54 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 4 + - 3337.75 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4438.26 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4371.87 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 117.712 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 65.2676 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 3983.44 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3420.08 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 2003.53 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4290.62 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 486.923 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4212.23 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4368.14 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 2 + - 3616.37 + - - - 448 + - 5888 + - 1 + - 
1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3612.48 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 2 + - 3591.67 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3478.54 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 177.026 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 6 + - 146.766 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 4 + - 1278.81 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 971.81 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 2 + - 2876.7 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 0 + - 4240.96 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4318.06 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 2 + - 2208.57 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 2917.28 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4238.0 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 2.8551 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 2581.76 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 2 + - 3438.52 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 2855.58 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4304.2 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 6 + - 68.3931 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 3847.09 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 106.38 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 4 + - 3466.6 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 
1792 + - - 0 + - 3818.04 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 2706.07 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 4390.57 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 973.223 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 4 + - 2520.87 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 1 + - 4031.16 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4211.28 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 3917.47 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 1081.82 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4391.63 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 4 + - 1603.55 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 2 + - 3073.59 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1016.7 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4032.15 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 4 + - 2018.81 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 0 + - 3578.48 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 105.872 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 28.5936 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 4 + - 641.842 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4166.77 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 7 + - 152.668 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 3889.62 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 2909.64 + - - - 2368 + - 5056 + - 1 
+ - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4240.33 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4398.42 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 2 + - 3127.64 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 2789.69 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 1472.72 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 4427.89 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 1746.49 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3335.98 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 4 + - 2491.91 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4286.95 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4513.2 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 3905.23 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 2501.33 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4320.44 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3847.15 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4450.1 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 1562.15 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 4078.36 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 813.39 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 10.5545 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 3404.04 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3878.26 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 
256 + - 768 + - - 4 + - 3096.47 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 4 + - 2839.65 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 0 + - 3949.79 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 1 + - 3620.54 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4291.23 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 2 + - 2716.72 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3600.09 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4134.21 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4219.34 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 4 + - 3591.88 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 3883.36 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3562.83 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4303.51 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 1 + - 3964.3 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4132.39 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 4 + - 3524.34 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 2 + - 3183.53 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 2 + - 2681.31 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 2744.04 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 4 + - 3700.79 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4237.23 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 4 + - 2671.88 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 
1408 + - 1408 + - 768 + - - 4 + - 2392.8 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4301.81 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 2 + - 3587.41 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4287.93 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 1 + - 4062.15 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4230.32 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 3154.27 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4033.56 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4341.11 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4203.36 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 907.203 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 4 + - 1165.24 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3858.51 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3872.4 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 2312.38 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3536.18 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 19.4596 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4407.57 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 4 + - 3548.1 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 4 + - 3538.51 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 0 + - 3876.59 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 4 + - 3620.31 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 
1024 + - 768 + - - 6 + - 37.2908 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 2522.63 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 2283.9 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 177.085 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4482.96 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3189.17 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 469.436 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4089.54 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 4 + - 3595.4 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 85.5961 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 4210.42 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3599.65 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 145.789 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 3864.67 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3047.55 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 4 + - 1392.8 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 1 + - 3840.63 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 0 + - 3890.05 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4019.7 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 0 + - 4200.22 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3626.32 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 113.139 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4208.82 + - - - 1856 
+ - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 4115.61 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4291.24 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 4 + - 1825.87 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 3803.13 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 4 + - 3713.96 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 466.587 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 941.001 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 122.644 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 2830.82 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4550.77 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 2 + - 2813.17 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3212.09 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 3659.11 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 4 + - 1117.38 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 5 + - 3850.82 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4293.64 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4372.66 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3314.5 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 65.7843 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 77.2831 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3472.0 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4484.4 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 64 + 
- 1792 + - - 4 + - 42.0475 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 3521.99 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4305.4 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 39.5969 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 4 + - 3783.92 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 4220.54 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 3812.62 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 1925.91 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 26.4778 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 3581.57 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 69.3786 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 3875.64 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 2396.93 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 5 + - 3643.55 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3837.09 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 2930.26 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 3981.74 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 4 + - 1500.98 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4406.67 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 1 + - 3964.6 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 153.951 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 2004.6 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 6 + - 39.0944 + - - - 
256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 3591.41 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 3503.53 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 6 + - 65.2871 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 3556.53 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4335.45 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 3884.18 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 4 + - 3209.76 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 310.113 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4338.32 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 4 + - 1232.18 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 4 + - 458.427 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 855.55 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3777.0 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 4 + - 2296.02 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4170.19 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4382.03 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 37.6909 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 2 + - 3136.93 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3989.26 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4251.7 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4436.7 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 2 + - 3257.99 + - - - 704 + - 1024 + - 1 
+ - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 3273.65 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 5 + - 3925.06 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 5.57925 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4510.07 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 4092.01 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 3314.93 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4390.69 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 0 + - 3183.94 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 3650.6 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4221.88 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 4185.39 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 0 + - 3839.13 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 1635.92 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 1819.52 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 2847.72 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 4 + - 3528.36 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 5 + - 4034.28 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 0 + - 3942.86 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 4 + - 884.75 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3403.68 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 2 + - 3373.25 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4407.27 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 
1408 + - 1408 + - 256 + - - 0 + - 3791.92 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4439.62 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 707.811 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 3320.49 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 4 + - 2824.93 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 3306.71 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 4 + - 3386.86 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 2901.12 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 2365.11 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4220.64 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 1919.23 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 4 + - 2654.59 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 4099.85 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4235.16 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 6 + - 141.164 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 4 + - 1561.99 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 6 + - 163.726 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 3243.82 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4262.05 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 620.839 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 6 + - 122.084 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 4146.4 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 
+ - - 0 + - 3645.2 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 3092.71 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 972.701 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 4 + - 2004.99 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 940.27 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 2819.19 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 3158.57 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 2 + - 2422.91 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4352.68 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 1114.25 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 4 + - 3282.36 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 3516.01 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 3392.83 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 50.9029 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 323.95 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 2253.61 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 1353.04 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 1929.22 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 2 + - 3587.43 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 0 + - 3835.87 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 706.515 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 3440.15 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3885.38 + - - - 704 + - 6784 + - 1 + - 768 
+ - 704 + - 704 + - 704 + - 768 + - - 5 + - 3824.47 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 3726.59 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 2899.6 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 546.097 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 2810.3 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 4 + - 3308.83 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 1838.35 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 2844.89 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4436.46 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 413.849 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 3834.88 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 4 + - 2072.73 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 3355.64 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4172.09 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 2016.12 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 4140.09 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4263.85 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 1175.69 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 2921.92 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 4 + - 2420.36 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4470.25 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 18.7769 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 
0 + - 3584.48 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 2 + - 3157.79 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 2 + - 3116.27 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 2041.0 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 2004.82 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 2 + - 3368.5 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 2394.34 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3990.62 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4053.64 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 103.51 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 4 + - 2992.13 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 4.3018 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 0 + - 3655.24 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4355.33 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 1 + - 3743.87 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4279.05 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4359.76 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4052.58 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 1 + - 3966.69 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 0 + - 3961.7 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 413.601 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 4 + - 3466.5 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 3298.18 + - 
- - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3834.83 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 2681.82 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 2293.28 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3383.62 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 3942.93 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 1504.24 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 4 + - 2005.1 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 2842.87 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 3944.01 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4505.84 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 4 + - 2598.79 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 4 + - 2849.46 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 3799.8 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 4 + - 3109.47 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 4 + - 1666.17 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 2 + - 2697.01 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 3757.73 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 88.8594 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 1755.18 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 6 + - 216.435 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 0 + - 4174.1 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 2673.84 + - - - 2944 + - 2944 + - 1 + - 
3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4413.93 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 4071.28 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 2915.75 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 3194.29 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4344.42 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 599.545 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 51.9619 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4358.44 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 75.0678 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 2456.82 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 3914.79 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 6 + - 210.043 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 355.184 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 1 + - 4222.24 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 3766.21 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 2309.9 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4375.64 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4400.81 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 3512.95 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4372.96 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 2 + - 3314.6 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 2788.15 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 
1408 + - 1408 + - 768 + - - 2 + - 3470.94 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4224.05 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 426.706 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 4 + - 1212.98 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4383.27 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 4170.99 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 6 + - 20.853 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4219.89 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4305.85 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 2414.41 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 27.5612 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 3823.27 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 0.180014 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 4 + - 2709.42 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 6 + - 66.4912 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 26.8365 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 2846.36 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 486.132 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 2870.45 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4284.18 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 1237.36 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 161.971 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 473.754 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 4 + 
- 256 + - - 6 + - 14.7922 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4378.69 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 39.3219 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 2 + - 3374.36 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 3922.51 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 1359.35 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 4 + - 831.384 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 1 + - 4049.19 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 6 + - 51.5262 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 1623.91 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 2 + - 3128.25 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4088.11 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4351.11 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 2 + - 2813.9 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3337.32 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 4 + - 3357.67 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4431.33 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 67.3512 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 152.321 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 2349.08 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 3386.08 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4445.62 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 4382.58 + - - - 704 + 
- 3584 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 0 + - 3199.33 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 2971.89 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 853.861 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4384.3 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3948.31 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 645.771 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 29.3082 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4428.83 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 2641.57 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 2 + - 2874.36 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 85.644 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 52.3054 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 3949.66 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 4 + - 3272.76 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 2981.91 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 620.645 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 3675.33 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4272.82 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 2151.66 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3446.87 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 4081.81 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 4 + - 1806.81 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + 
- 4288 + - 1792 + - - 0 + - 4348.63 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 6 + - 126.157 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 2 + - 3439.18 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 7 + - 65.8728 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 7 + - 168.352 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 0 + - 3955.31 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 2599.16 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 0 + - 3365.12 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4156.25 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 2183.88 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 0.16435 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 1817.93 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3986.34 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4467.96 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 3323.07 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4362.75 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 167.985 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 3277.24 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4483.15 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 1 + - 3683.72 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 3648.54 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 3 + - 56.6186 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4538.21 + - - - 64 + - 5888 + 
- 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1808.61 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 51.385 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 2136.28 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 3367.09 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4466.18 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4267.7 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 2346.94 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 0 + - 3496.13 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 175.394 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 2106.71 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 3802.5 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 2.81138 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3893.42 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 2062.51 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4021.01 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 108.985 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 2997.83 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 3414.13 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 3535.97 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 37.1752 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 2 + - 3608.27 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 2 + - 3301.8 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 2 + - 3276.15 + 
- - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 5.68895 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 236.913 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 685.472 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 2815.43 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 3158.4 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4449.21 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 1194.04 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 201.767 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3995.15 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 4 + - 2110.15 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 77.2071 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 3346.02 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 102.376 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 4446.59 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 1272.63 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4447.08 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 2 + - 3590.81 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 3653.6 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 2 + - 2350.19 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3925.01 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 2841.71 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3496.59 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + 
- 768 + - - 0 + - 3892.82 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 6 + - 66.4303 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 3841.0 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 3700.87 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 67.3682 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 3359.0 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4303.35 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 4 + - 2261.43 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3545.66 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 2917.28 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 2408.59 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 311.499 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 113.959 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 28.9247 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 2 + - 3122.59 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 4 + - 2270.31 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 5.19179 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 2878.7 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 810.993 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 3406.1 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4303.8 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 88.8763 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 0 + - 4354.35 + - - - 2368 + - 2944 + - 1 + - 256 + - 
2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3647.79 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 88.0468 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 1797.57 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 3546.49 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 4 + - 2842.82 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2272.66 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1603.22 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4248.6 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 2 + - 3105.96 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 6 + - 158.977 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 1 + - 3789.53 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 6 + - 13.8983 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 1844.45 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4352.84 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4156.79 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 4 + - 1558.33 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 4201.32 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 4 + - 2526.34 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 6 + - 131.646 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 4164.88 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4187.25 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 3955.06 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 2 
+ - 2990.22 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 2 + - 2332.57 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 19.1452 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 2 + - 2036.99 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 1 + - 4131.84 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 2 + - 2340.12 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4059.02 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 1081.89 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4409.11 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 1 + - 4053.36 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 2125.25 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 829.328 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1199.94 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 2 + - 3186.05 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 3064.83 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3658.24 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4318.46 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3774.09 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 1216.52 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 2450.68 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 2229.66 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 0 + - 3632.48 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 1278.57 + - - - 448 + - 2368 + - 1 + - 1792 
+ - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3033.67 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4229.1 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3960.26 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 8.81501 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 1555.19 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 6 + - 187.576 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 3593.47 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4309.56 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4241.55 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4438.11 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 0.174666 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 354.956 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 3946.94 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 5.61614 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 939.016 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 51.8841 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2602.33 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 3935.01 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 11.1859 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 2 + - 3277.53 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 4 + - 1177.61 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 3337.25 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 2 + - 2596.29 + - - - 704 + - 4288 
+ - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 3139.9 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 38.8583 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 4 + - 3334.39 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2106.64 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1396.15 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 3808.46 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4268.92 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 5 + - 4099.11 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 0 + - 3782.42 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 0 + - 3928.11 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4421.71 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 6 + - 182.008 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4304.59 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4363.64 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 0 + - 3039.91 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 856.058 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 2103.1 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 3918.06 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 123.857 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4444.23 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 4 + - 2969.4 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 3903.79 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 
768 + - - 4 + - 1693.52 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4175.34 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 3720.08 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 0 + - 4035.78 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 1228.64 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 11.0129 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 5 + - 3953.81 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 3985.78 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 1925.05 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 2 + - 3010.0 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 309.78 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3735.58 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4027.83 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 3636.0 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 6 + - 93.6675 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 2399.17 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 3423.39 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 3767.34 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 0 + - 2839.1 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 6 + - 193.705 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 4 + - 1630.78 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4522.67 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 6 + - 
146.003 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 3335.1 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 4 + - 3345.53 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 1398.58 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 2315.01 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 3727.86 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4447.64 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 4193.48 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3535.31 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 1 + - 3783.23 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4293.49 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 4022.27 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 3177.71 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 2846.98 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3475.39 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 2 + - 2576.59 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3718.73 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4304.38 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4318.24 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 10.3916 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 683.982 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4161.2 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4475.37 + - - - 128 + - 
6784 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 3254.98 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4534.9 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4294.38 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4213.48 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 2528.34 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4497.43 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 0 + - 3206.99 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 299.391 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 5.5019 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 6 + - 136.946 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4211.69 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4157.48 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 6 + - 78.2187 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4210.24 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 4 + - 2094.36 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4166.93 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 5 + - 3897.19 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 2736.65 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4272.96 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 6 + - 81.3897 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 1640.78 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 3594.0 + - - - 448 + - 2368 + - 1 + - 3328 
+ - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3111.99 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 1924.71 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 170.244 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 6 + - 167.88 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4174.21 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2483.92 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 4 + - 1625.03 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 4 + - 2454.36 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 8.53043 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4196.47 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 622.67 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3337.02 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 2414.36 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 3958.29 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4525.65 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 99.0835 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 3725.24 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4236.78 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 2851.2 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 65.8084 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 622.464 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 4 + - 1368.6 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3636.78 + - 
- - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 0 + - 3329.6 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 1 + - 3788.13 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 5 + - 3390.79 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4287.42 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 2.16568 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 0 + - 3715.85 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 2090.83 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4215.1 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 81.9089 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 55.3903 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4159.21 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 3842.26 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 4 + - 2501.76 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 2 + - 2268.93 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4132.9 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 4 + - 2308.35 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4086.19 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4012.17 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4404.48 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4455.05 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4354.7 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 2862.5 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + 
- 64 + - 1792 + - - 4 + - 1230.09 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 1 + - 3902.67 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4478.32 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 4202.39 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 2.74515 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 2892.5 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 2817.72 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 1681.35 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3544.68 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 1 + - 3731.44 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 2227.05 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 343.249 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4275.42 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 271.006 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 0 + - 3656.22 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3691.99 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4290.75 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3922.54 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 3839.83 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 2 + - 3432.95 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4393.5 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 3817.28 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3971.4 
+ - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 0 + - 3899.05 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 470.339 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 27.9471 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3766.7 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 3917.02 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4152.14 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3593.62 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2017.14 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 4 + - 2020.69 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 2.80058 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 1 + - 4055.39 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4432.52 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 4 + - 2152.54 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 4 + - 2459.64 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 0 + - 3892.22 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 3729.64 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 1910.26 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4154.37 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 52.7318 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 936.403 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 100.369 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 3453.74 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + 
- 128 + - 256 + - - 4 + - 1168.07 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 1 + - 4206.35 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4363.46 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4149.06 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 4 + - 3035.07 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 6 + - 117.699 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 2 + - 3160.31 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 1996.14 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4131.38 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 3837.64 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 2.66246 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 2814.43 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 4 + - 641.081 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 680.725 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4501.36 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 4116.91 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 2 + - 3108.16 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 2984.26 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 3958.02 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 3645.34 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 2756.23 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 2914.11 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 
+ - - 0 + - 4387.15 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 4 + - 2732.26 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 4 + - 1024.58 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 1411.08 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4338.48 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 3471.7 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 3846.09 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4396.05 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 4 + - 2400.4 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 3138.11 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 21.1136 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 2 + - 3439.41 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 2729.96 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 2 + - 2796.96 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 3697.35 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 0 + - 3373.74 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4211.32 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4269.1 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4192.47 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 4 + - 2932.38 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 3438.33 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4548.6 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 4 + - 3102.51 + - - 
- 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 2397.8 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 36.8767 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 1 + - 4029.1 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 3916.04 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 4 + - 1307.18 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 4 + - 3336.43 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 1407.1 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4386.99 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4401.13 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 3134.45 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 3216.63 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 1999.7 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 0 + - 3818.03 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 1924.43 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 1 + - 3975.58 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 2 + - 2854.58 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4321.86 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 2 + - 2709.33 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 2011.24 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 2 + - 3140.85 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 6 + - 27.7227 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 2968.87 + - - - 1856 + - 4288 + - 1 + 
- 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4055.79 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3921.39 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 1772.15 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 119.71 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 425.978 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 2732.52 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 4 + - 855.437 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 2 + - 3160.79 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4271.18 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4351.49 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 3582.75 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 2 + - 2330.02 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 0 + - 4202.58 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4381.18 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 4 + - 2187.79 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 27.1515 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 1835.59 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 3805.24 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 4 + - 1477.3 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4424.26 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 2 + - 3441.37 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 2.17143 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 
+ - - 0 + - 3947.1 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4344.96 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 1922.23 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 204.405 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4346.81 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4192.06 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 5 + - 3864.22 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 53.1812 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 3822.01 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 3952.49 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 4 + - 2880.04 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 4296.1 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3722.34 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 44.113 +- null diff --git a/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml b/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml new file mode 100644 index 000000000..4a1e8ca4b --- /dev/null +++ b/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml @@ -0,0 +1,11955 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + 
- 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + 
LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + 
ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x32x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + 
LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: 
true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 16 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + 
LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + 
TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 32 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 
3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + 
Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x128x8_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 
16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + 
SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + 
KernelLanguage: Assembly + LSCA: 16 + LSCB: 32 + LSPA: 16 + LSPB: 8 + LVCA: 16 + LVCB: 32 + LVPA: 16 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 
+ OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x32x16_SE_AMAS0_GRVW1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + 
InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + 
NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 
0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + 
NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2944 + - - 1 + - 2154.74 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 4288 + - - 1 + - 3395.96 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 2944 + - - 3 + - 4435.68 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 6784 + - - 3 + - 4355.31 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 3584 + - - 1 + - 3460.65 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 128 + - - 1 + - 563.38 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 64 + - - 0 + - 1047.26 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 448 + - - 1 + - 2796.91 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 64 + - - 0 + - 1789.11 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 5056 + - - 3 + - 4344.79 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 1792 + 
- 1856 + - - 6 + - 66.4662 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 2944 + - - 3 + - 3632.79 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 256 + - - 3 + - 3683.52 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 448 + - - 4 + - 4079.75 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 256 + - 4 + - - 6 + - 21.32 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 6784 + - - 3 + - 4200.4 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 768 + - 2368 + - - 1 + - 2651.61 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 128 + - - 1 + - 2051.18 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 6784 + - - 3 + - 3262.44 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 2944 + - - 3 + - 4280.36 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 5056 + - - 3 + - 4263.55 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1024 + - - 3 + - 3688.25 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 768 + - 2368 + - - 1 + - 2050.12 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3584 + - - 4 + - 3622.95 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 448 + - - 4 + - 2802.9 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 64 + - - 0 + - 2268.1 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 128 + - - 1 + - 2796.16 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 3584 + - - 3 + - 3371.91 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 2368 + - - 3 + - 4182.54 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 5056 + - - 2 + - 3967.01 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 6784 + - - 3 + - 4529.68 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 128 + - - 1 + - 3294.07 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 5888 + - - 3 
+ - 4480.88 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 448 + - - 5 + - 283.064 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 5056 + - - 3 + - 4030.58 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 448 + - - 1 + - 2803.5 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 5888 + - - 3 + - 4316.92 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 704 + - - 2 + - 3809.33 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 448 + - - 1 + - 2430.17 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1024 + - - 0 + - 2632.78 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 4 + - - 7 + - 196.963 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 64 + - - 0 + - 1515.86 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1408 + - - 1 + - 3407.32 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 4 + - - 7 + - 108.621 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 5056 + - - 1 + - 2405.19 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 6784 + - - 3 + - 4201.43 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 704 + - - 5 + - 442.372 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 5056 + - - 3 + - 3769.15 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 2944 + - - 3 + - 3841.79 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 128 + - - 1 + - 3201.65 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1408 + - - 1 + - 3268.26 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 5056 + - - 3 + - 4273.39 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 704 + - - 0 + - 2570.23 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 3584 + - - 3 + - 4159.05 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 768 + - 256 + - - 1 + - 1024.45 + - - - 1024 + - 448 
+ - 1 + - 256 + - 1024 + - 1024 + - 256 + - 448 + - - 1 + - 2223.13 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 64 + - - 1 + - 807.878 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 6784 + - - 3 + - 4452.55 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 768 + - 5056 + - - 1 + - 3104.49 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 256 + - - 0 + - 2556.74 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1408 + - - 3 + - 3671.17 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 6784 + - - 3 + - 3805.38 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 64 + - - 1 + - 1642.21 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 256 + - 3584 + - - 6 + - 99.3833 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 3584 + - - 3 + - 3868.8 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 4 + - - 7 + - 83.3113 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 768 + - 1856 + - - 1 + - 2938.77 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 3584 + - - 3 + - 4203.01 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1024 + - - 3 + - 3052.73 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 128 + - - 1 + - 2875.24 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 704 + - - 5 + - 453.438 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1856 + - - 3 + - 4139.24 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 2368 + - - 3 + - 4214.64 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 256 + - - 1 + - 1953.0 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 2368 + - - 1 + - 2253.96 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 4288 + - - 1 + - 2882.61 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 5056 + - - 3 + - 4357.58 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + 
- 3328 + - 5056 + - - 1 + - 3385.32 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 5888 + - - 3 + - 3988.22 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1408 + - - 1 + - 1139.91 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 768 + - 5888 + - - 1 + - 2489.62 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 448 + - - 0 + - 1116.51 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 5056 + - - 3 + - 3883.79 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 64 + - - 1 + - 2524.95 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 256 + - 6784 + - - 1 + - 2136.61 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 6784 + - - 3 + - 4405.78 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 256 + - 2944 + - - 3 + - 2845.48 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 5888 + - - 3 + - 4403.69 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 1856 + - - 3 + - 4191.92 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 2944 + - - 3 + - 4390.73 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 256 + - 64 + - - 5 + - 326.246 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1856 + - - 1 + - 1428.09 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 4 + - - 6 + - 29.8564 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 704 + - - 6 + - 29.2582 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 768 + - 4 + - - 6 + - 2.64714 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 6784 + - - 3 + - 4454.39 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 256 + - - 1 + - 2754.04 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 256 + - 64 + - - 5 + - 28.3993 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 448 + - - 0 + - 1154.0 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 6784 + - - 6 + - 217.039 + - - - 256 + - 1856 + - 1 + - 256 + - 
256 + - 256 + - 256 + - 1856 + - - 1 + - 2305.79 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 5056 + - - 3 + - 4215.33 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 4 + - - 6 + - 5.61868 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1856 + - - 1 + - 805.999 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 5056 + - - 3 + - 4366.75 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 4 + - - 6 + - 5.69236 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 1408 + - - 0 + - 2556.93 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 4 + - - 6 + - 19.7227 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 256 + - 5888 + - - 6 + - 148.555 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 768 + - 2368 + - - 3 + - 3502.76 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 64 + - - 1 + - 1889.67 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 256 + - - 0 + - 1153.22 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 128 + - - 1 + - 1147.31 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 256 + - 4288 + - - 1 + - 1727.46 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 704 + - - 3 + - 2999.57 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 768 + - 128 + - - 5 + - 300.95 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1024 + - - 3 + - 3791.56 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 4 + - - 6 + - 65.8957 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 2944 + - - 3 + - 4313.69 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 64 + - - 0 + - 1150.65 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 768 + - 5056 + - - 1 + - 2165.45 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 2944 + - - 1 + - 3278.5 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 5056 + - - 3 + - 4129.32 + - - - 2944 + 
- 256 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 256 + - - 1 + - 2650.31 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1024 + - - 6 + - 37.7779 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 3584 + - - 1 + - 3273.25 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 2368 + - - 3 + - 3527.53 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 4288 + - - 3 + - 4149.18 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 64 + - - 1 + - 2478.11 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 768 + - 6784 + - - 3 + - 4196.32 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 256 + - 6784 + - - 1 + - 2424.86 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 64 + - - 0 + - 905.795 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 4 + - - 6 + - 67.2541 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 2368 + - - 3 + - 4152.86 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 1024 + - - 3 + - 3629.35 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 4288 + - - 3 + - 4342.31 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 5056 + - - 2 + - 4247.06 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 5888 + - - 6 + - 184.597 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1856 + - - 0 + - 1191.56 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1408 + - - 1 + - 2202.64 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 2368 + - - 2 + - 3783.67 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 704 + - - 1 + - 3339.36 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 256 + - - 1 + - 1784.73 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1856 + - - 3 + - 4155.4 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 2944 + - - 3 + - 3368.85 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + 
- 2944 + - 3328 + - 3584 + - - 3 + - 4316.78 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1856 + - - 3 + - 3973.93 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 5056 + - - 3 + - 4380.56 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 4288 + - - 3 + - 4148.0 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 3584 + - - 3 + - 4110.84 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1408 + - - 6 + - 53.895 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 128 + - - 1 + - 1764.36 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 128 + - - 1 + - 2220.66 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 256 + - 5056 + - - 1 + - 1633.92 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 704 + - - 3 + - 3611.57 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 768 + - 5888 + - - 6 + - 170.719 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1024 + - - 3 + - 3225.04 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1024 + - - 5 + - 457.694 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 768 + - 4288 + - - 1 + - 2057.12 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 4 + - - 7 + - 223.457 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 5888 + - - 3 + - 4250.39 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 128 + - - 0 + - 879.499 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 2368 + - - 3 + - 3937.39 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 4 + - - 6 + - 113.235 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 768 + - 6784 + - - 3 + - 3632.54 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 4288 + - - 3 + - 4313.24 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 64 + - - 0 + - 2163.14 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 3584 + - - 3 + - 3946.79 + - 
- - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 6784 + - - 3 + - 3947.63 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 64 + - - 0 + - 1873.98 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 1408 + - - 3 + - 4063.24 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 5888 + - - 3 + - 4438.31 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 5888 + - - 3 + - 3718.46 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 5888 + - - 6 + - 190.624 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 64 + - - 1 + - 3170.27 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 256 + - - 0 + - 2456.12 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 128 + - - 1 + - 3366.77 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1408 + - - 1 + - 2671.87 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 704 + - - 3 + - 3188.83 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 4 + - - 6 + - 11.4646 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 64 + - - 6 + - 2.82429 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 3584 + - - 3 + - 4280.85 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 4 + - - 7 + - 52.7304 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 704 + - - 4 + - 3360.57 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 5888 + - - 3 + - 3882.54 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 2944 + - - 3 + - 3645.67 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1856 + - - 3 + - 3918.49 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1024 + - - 3 + - 4171.13 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1408 + - - 1 + - 2632.03 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 4288 + - - 3 + - 4386.84 + - - - 4 + - 704 + - 1 + - 
3328 + - 4 + - 4 + - 3328 + - 704 + - - 6 + - 26.0074 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 2944 + - - 3 + - 4366.27 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 2368 + - - 3 + - 4206.26 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 704 + - - 1 + - 3224.87 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1408 + - - 0 + - 905.46 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 128 + - - 0 + - 1312.42 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 256 + - 128 + - - 6 + - 4.46839 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 448 + - - 4 + - 3421.36 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 4288 + - - 3 + - 4161.56 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 3584 + - - 3 + - 4188.77 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 3584 + - - 0 + - 2058.72 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1024 + - - 0 + - 2831.34 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 6784 + - - 3 + - 4011.74 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 4 + - - 6 + - 2.8399 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 2944 + - - 1 + - 3386.7 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1856 + - - 3 + - 4075.24 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 6784 + - - 1 + - 3769.89 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 6784 + - - 1 + - 3287.92 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 256 + - - 0 + - 2245.04 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 448 + - - 0 + - 2319.18 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 256 + - - 6 + - 11.2366 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 64 + - - 5 + - 81.0254 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 2368 + - - 3 + 
- 4142.46 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 128 + - - 1 + - 1157.94 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 256 + - 704 + - - 1 + - 1667.69 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 1856 + - - 6 + - 68.0864 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 5056 + - - 3 + - 4399.76 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 256 + - 3584 + - - 1 + - 1347.79 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 3584 + - - 2 + - 3825.81 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 256 + - 4288 + - - 3 + - 3467.81 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3584 + - - 1 + - 3418.17 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 256 + - 4 + - - 6 + - 2.22489 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 6784 + - - 3 + - 4509.88 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 1856 + - - 3 + - 3814.77 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 768 + - 704 + - - 6 + - 27.5237 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1856 + - - 3 + - 4192.73 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 256 + - - 5 + - 161.14 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 1856 + - - 3 + - 3956.52 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 448 + - - 6 + - 18.1699 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1856 + - - 3 + - 4267.85 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 4288 + - - 3 + - 4357.6 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 2944 + - - 3 + - 4385.67 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 64 + - - 1 + - 2878.51 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 4288 + - - 3 + - 3966.55 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1856 + - - 3 + - 3308.7 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 
+ - 1408 + - 768 + - 704 + - - 1 + - 2620.62 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 256 + - 3584 + - - 3 + - 3432.35 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 768 + - 4288 + - - 6 + - 128.768 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 5888 + - - 3 + - 3368.33 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 64 + - - 5 + - 282.931 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 2944 + - - 3 + - 2877.95 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 704 + - - 1 + - 3410.53 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 5888 + - - 3 + - 4458.44 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1024 + - - 2 + - 3307.91 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 5888 + - - 1 + - 2883.0 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 2368 + - - 3 + - 4225.4 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1408 + - - 3 + - 4199.74 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 6784 + - - 1 + - 3327.96 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 5888 + - - 3 + - 4401.63 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 4 + - - 7 + - 124.978 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 3584 + - - 3 + - 4393.06 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 704 + - - 0 + - 1721.69 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 704 + - - 0 + - 1793.65 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 256 + - 6784 + - - 3 + - 3040.5 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 3584 + - - 3 + - 4272.38 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1856 + - - 2 + - 3903.7 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 256 + - 704 + - - 1 + - 629.146 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 768 + - 2944 + - - 1 + - 
2670.33 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 3584 + - - 3 + - 4352.16 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 2944 + - - 3 + - 4291.83 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 4 + - - 6 + - 0.181889 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 256 + - 3584 + - - 3 + - 3070.9 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1024 + - - 1 + - 1932.18 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 128 + - - 1 + - 2100.19 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 3584 + - - 2 + - 4045.95 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 5056 + - - 3 + - 3925.5 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 2368 + - - 1 + - 2791.14 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 2368 + - - 1 + - 3488.93 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 2368 + - - 3 + - 3659.21 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 2944 + - - 1 + - 3424.01 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 6784 + - - 3 + - 4288.98 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 704 + - - 0 + - 878.708 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 128 + - - 1 + - 2937.36 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 128 + - - 1 + - 3026.12 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1024 + - - 2 + - 3436.13 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 5888 + - - 1 + - 2773.74 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 256 + - 6784 + - - 6 + - 165.233 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 768 + - 448 + - - 1 + - 1712.88 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 768 + - 4 + - - 6 + - 0.162793 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 768 + - 128 + - - 5 + - 75.5218 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 
4288 + - 1792 + - 448 + - - 4 + - 4021.56 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 4288 + - - 6 + - 142.555 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1856 + - - 0 + - 1149.13 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 5056 + - - 3 + - 4204.4 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 768 + - 3584 + - - 3 + - 3726.1 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1856 + - - 0 + - 2190.11 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 4 + - - 6 + - 29.0197 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1024 + - - 3 + - 4013.7 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 2368 + - - 3 + - 4340.68 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1408 + - - 1 + - 2736.93 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 1408 + - - 3 + - 3850.38 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 3584 + - - 3 + - 4344.8 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 256 + - - 1 + - 2024.05 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 5056 + - - 3 + - 4159.28 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 4 + - - 6 + - 65.3819 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 5888 + - - 3 + - 4019.57 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 6784 + - - 2 + - 3444.28 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 6784 + - - 3 + - 4364.07 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 448 + - - 5 + - 291.058 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 4288 + - - 3 + - 4339.01 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 1 + - 2126.49 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 256 + - 4 + - - 7 + - 0.128731 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 256 + - 5056 + - - 1 + - 1880.73 + 
- - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 704 + - - 1 + - 2429.39 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 5056 + - - 2 + - 4006.44 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 704 + - - 3 + - 3701.68 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 3584 + - - 1 + - 2553.65 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 704 + - - 0 + - 2044.13 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 2944 + - - 3 + - 4345.89 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 704 + - - 4 + - 2876.54 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 5056 + - - 3 + - 4164.94 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 6784 + - - 3 + - 3831.27 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 704 + - - 2 + - 4035.03 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 4 + - - 7 + - 68.8263 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 5 + - 240.095 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 128 + - - 6 + - 5.67092 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 448 + - - 1 + - 2937.04 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 768 + - 256 + - - 1 + - 591.71 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 704 + - - 3 + - 3574.11 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 2944 + - - 1 + - 3225.64 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 768 + - 128 + - - 6 + - 5.38123 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1856 + - - 1 + - 3839.58 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 768 + - 2368 + - - 0 + - 1313.72 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1024 + - - 4 + - 1993.81 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 768 + - 2944 + - - 1 + - 3168.14 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 
+ - 3328 + - 256 + - - 3 + - 3871.85 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 4288 + - - 3 + - 3935.49 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 5056 + - - 6 + - 161.735 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 2368 + - - 6 + - 83.9317 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 768 + - 64 + - - 5 + - 36.7607 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 256 + - 5888 + - - 3 + - 3569.55 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 448 + - - 1 + - 3436.67 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 128 + - - 5 + - 579.833 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 4288 + - - 3 + - 4081.96 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 448 + - - 0 + - 1876.64 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 768 + - 3584 + - - 6 + - 113.916 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1856 + - - 1 + - 3468.52 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 2368 + - - 4 + - 3200.91 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 4288 + - - 3 + - 3757.2 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 3584 + - - 3 + - 4462.71 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 768 + - 1024 + - - 0 + - 1148.01 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 2368 + - - 3 + - 4286.56 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 5056 + - - 3 + - 4019.88 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 256 + - - 3 + - 2874.91 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 704 + - - 3 + - 3642.1 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1408 + - - 3 + - 4126.68 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 4288 + - - 3 + - 4202.98 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 768 + - 1408 + - - 1 + - 2430.78 + - - 
- 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 2944 + - - 0 + - 1866.99 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 704 + - - 3 + - 3763.87 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 256 + - - 3 + - 2905.69 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1024 + - - 2 + - 3822.56 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 768 + - 3584 + - - 3 + - 3431.96 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 4 + - - 7 + - 39.5375 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 5888 + - - 3 + - 4507.94 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1408 + - - 3 + - 3898.93 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 4 + - - 7 + - 170.756 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 4288 + - - 3 + - 3374.76 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1024 + - - 1 + - 2216.42 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 5888 + - - 3 + - 3930.65 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 4 + - - 7 + - 104.183 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 4288 + - - 3 + - 4125.72 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 3 + - 2160.26 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 256 + - 64 + - - 5 + - 60.2538 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 4288 + - - 3 + - 4027.28 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1408 + - - 3 + - 4378.95 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 704 + - - 1 + - 3286.15 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 6784 + - - 3 + - 4441.24 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 256 + - - 1 + - 2678.37 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 2944 + - - 1 + - 2942.25 + - - - 448 + - 1408 + - 1 + - 
768 + - 448 + - 448 + - 768 + - 1408 + - - 0 + - 2341.96 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1408 + - - 2 + - 3788.99 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 4 + - - 6 + - 165.457 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 64 + - - 1 + - 2035.75 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 448 + - - 3 + - 3555.74 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 768 + - 448 + - - 1 + - 2130.93 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1024 + - - 2 + - 3852.56 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 128 + - - 0 + - 2379.48 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 448 + - - 1 + - 2311.36 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1024 + - - 3 + - 3391.1 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1856 + - - 3 + - 4096.69 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 768 + - 5056 + - - 1 + - 3324.43 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1024 + - - 3 + - 3658.76 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 5888 + - - 3 + - 3321.44 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 6784 + - - 3 + - 4481.65 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1856 + - - 2 + - 3841.78 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 128 + - - 0 + - 907.989 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 64 + - - 6 + - 2.86677 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1856 + - - 3 + - 4256.24 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1856 + - - 0 + - 2321.69 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 128 + - - 0 + - 2351.94 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 5888 + - - 3 + - 4275.32 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 
1856 + - 768 + - 6784 + - - 3 + - 4392.73 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 4288 + - - 3 + - 4299.86 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 3584 + - - 3 + - 3221.43 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3584 + - - 3 + - 3588.19 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 448 + - - 5 + - 562.969 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 4288 + - - 3 + - 4427.91 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 64 + - - 0 + - 1596.37 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 5888 + - - 3 + - 4218.99 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 5888 + - - 3 + - 4304.8 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 5888 + - - 3 + - 4437.87 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 6784 + - - 3 + - 4338.36 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1408 + - - 3 + - 3827.09 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 448 + - - 1 + - 3028.48 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 256 + - 64 + - - 6 + - 2.16149 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1024 + - - 0 + - 638.116 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 1 + - 1341.46 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1856 + - - 1 + - 3411.8 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1024 + - - 0 + - 2910.08 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 3584 + - - 3 + - 4178.57 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 256 + - - 5 + - 332.227 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 448 + - - 4 + - 2810.12 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 3584 + - - 6 + - 123.305 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 2944 + - - 3 + - 
4444.42 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 1408 + - - 2 + - 3620.41 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 2944 + - - 3 + - 4076.08 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 64 + - - 1 + - 2116.94 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 6784 + - - 3 + - 4328.78 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 768 + - 4288 + - - 1 + - 1858.11 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 2944 + - - 3 + - 3991.41 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 2368 + - - 1 + - 3708.14 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 128 + - - 1 + - 2245.11 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1024 + - - 3 + - 2700.83 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 5888 + - - 3 + - 4276.37 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 2368 + - - 3 + - 3016.98 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1856 + - - 3 + - 3731.14 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 448 + - - 1 + - 2661.12 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 4 + - - 7 + - 85.9565 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1408 + - - 1 + - 3733.82 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 5056 + - - 3 + - 4364.35 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 2368 + - - 1 + - 2735.93 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 128 + - - 5 + - 166.376 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 64 + - - 1 + - 1375.05 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 448 + - - 0 + - 1994.96 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 448 + - - 1 + - 3443.81 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 768 + - 2944 + - - 0 + - 1573.23 + - - - 5056 + - 
5888 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 5888 + - - 3 + - 4441.27 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 128 + - - 0 + - 2617.79 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 448 + - - 1 + - 3156.3 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 6784 + - - 3 + - 4531.67 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 3 + - 2830.44 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 6784 + - - 4 + - 4117.82 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 3584 + - - 3 + - 4293.3 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1408 + - - 3 + - 3546.49 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 64 + - - 1 + - 2763.14 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 4288 + - - 3 + - 4133.48 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 4288 + - - 1 + - 2202.56 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 256 + - - 1 + - 3292.65 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 5056 + - - 1 + - 3501.38 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 128 + - - 0 + - 1720.96 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 4288 + - - 1 + - 2042.56 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 64 + - - 5 + - 166.351 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 448 + - - 1 + - 3241.75 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1408 + - - 3 + - 4351.92 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3584 + - - 3 + - 4394.14 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 5888 + - - 3 + - 3308.3 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 2944 + - - 3 + - 4068.2 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 768 + - 4288 + - - 3 + - 4005.9 + - - - 5056 + - 4 + - 
1 + - 256 + - 5056 + - 5056 + - 256 + - 4 + - - 7 + - 136.649 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 256 + - - 3 + - 3829.56 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 448 + - - 1 + - 3166.23 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1856 + - - 1 + - 3624.69 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 1856 + - - 3 + - 4288.33 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 768 + - 64 + - - 5 + - 150.841 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 768 + - 448 + - - 5 + - 519.604 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 6 + - 8.79919 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 6784 + - - 3 + - 4298.42 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 6784 + - - 1 + - 3202.64 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 64 + - - 1 + - 1403.59 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 2944 + - - 3 + - 4116.11 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1408 + - - 3 + - 3711.2 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 4 + - - 6 + - 11.2377 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 768 + - 704 + - - 5 + - 410.612 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 3584 + - - 3 + - 4387.93 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 5056 + - - 3 + - 4199.27 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1408 + - - 3 + - 3994.37 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1856 + - - 3 + - 3151.49 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 256 + - - 0 + - 1795.36 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 768 + - 4288 + - - 1 + - 3254.01 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 3 + - 3261.16 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 704 + - 
- 3 + - 3820.11 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 128 + - - 5 + - 162.165 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1856 + - - 1 + - 2355.49 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 448 + - - 5 + - 579.608 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 5056 + - - 3 + - 4326.41 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 5888 + - - 1 + - 2832.47 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 2944 + - - 3 + - 3752.01 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 64 + - - 1 + - 1853.75 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 704 + - - 0 + - 2894.85 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 5888 + - - 3 + - 3967.7 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 256 + - 2368 + - - 3 + - 3043.14 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 5888 + - - 3 + - 4472.33 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 768 + - 704 + - - 1 + - 1556.73 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3584 + - - 0 + - 2208.54 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1408 + - - 1 + - 1822.75 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1408 + - - 1 + - 3222.35 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 4 + - - 6 + - 67.8188 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 4288 + - - 6 + - 137.86 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 256 + - 5056 + - - 6 + - 131.077 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 2944 + - - 6 + - 103.457 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 768 + - 1408 + - - 1 + - 1530.75 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 768 + - 5888 + - - 3 + - 3654.22 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 1408 + - - 3 + - 3917.14 + - - - 4288 + - 1024 + - 1 + - 3328 + - 
4288 + - 4288 + - 3328 + - 1024 + - - 3 + - 3870.36 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 768 + - 256 + - - 5 + - 300.452 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 448 + - - 1 + - 3564.29 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1408 + - - 3 + - 3759.39 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 5056 + - - 3 + - 4285.16 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3584 + - - 3 + - 4206.14 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1408 + - - 3 + - 3819.55 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 6784 + - - 3 + - 4324.94 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 768 + - 704 + - - 1 + - 2135.64 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 5056 + - - 2 + - 4053.83 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 768 + - 2944 + - - 1 + - 3131.01 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 2944 + - - 1 + - 3257.82 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1856 + - - 3 + - 4110.16 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 128 + - - 1 + - 2858.72 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 5888 + - - 3 + - 4275.95 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 256 + - 4288 + - - 1 + - 1406.59 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3584 + - - 6 + - 127.765 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 3584 + - - 3 + - 4345.22 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 768 + - 64 + - - 6 + - 2.65114 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 448 + - - 4 + - 3319.44 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 256 + - 4288 + - - 7 + - 117.968 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 64 + - - 5 + - 290.76 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 768 + - 4 + - - 6 + - 28.0045 + - 
- - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3584 + - - 3 + - 4403.41 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 64 + - - 5 + - 41.3845 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 256 + - - 1 + - 1119.3 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 768 + - 6784 + - - 1 + - 3021.96 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 448 + - - 1 + - 2768.48 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 2944 + - - 1 + - 2893.54 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 704 + - - 3 + - 3722.59 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1856 + - - 3 + - 3831.57 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 256 + - 1856 + - - 7 + - 51.5633 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 6784 + - - 3 + - 4494.2 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 4288 + - - 3 + - 4388.73 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1856 + - - 3 + - 3932.71 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 3584 + - - 3 + - 3716.55 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1856 + - - 6 + - 66.9334 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 2368 + - - 0 + - 1512.88 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 4 + - - 7 + - 87.2041 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 768 + - 4288 + - - 1 + - 2672.27 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 64 + - - 1 + - 2176.07 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 768 + - 4 + - - 6 + - 18.4202 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1856 + - - 3 + - 3773.76 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 2368 + - - 3 + - 4150.48 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 256 + - 2368 + - - 1 + - 2298.21 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 
3328 + - 2944 + - - 3 + - 4395.25 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 448 + - - 1 + - 3502.67 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 768 + - 448 + - - 1 + - 1026.23 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 64 + - - 0 + - 1192.75 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 6784 + - - 3 + - 4457.05 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 1 + - 462.199 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 5056 + - - 3 + - 4343.29 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1024 + - - 3 + - 3181.8 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 2368 + - - 0 + - 1454.32 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1024 + - - 0 + - 2097.66 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1024 + - - 3 + - 3544.83 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 64 + - - 5 + - 443.72 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 256 + - 3584 + - - 1 + - 2193.89 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 128 + - - 1 + - 1884.75 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1408 + - - 1 + - 3090.16 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 4 + - - 6 + - 2.79002 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 6784 + - - 3 + - 4277.7 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 5888 + - - 4 + - 3893.72 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 3584 + - - 3 + - 4350.85 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 128 + - - 1 + - 83.1338 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 704 + - - 4 + - 3919.43 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 64 + - - 1 + - 1177.29 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 0 + - 1829.26 + - - - 
128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1024 + - - 1 + - 860.077 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 5056 + - - 3 + - 4298.08 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 2368 + - - 6 + - 86.665 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 768 + - 64 + - - 5 + - 262.711 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 768 + - 704 + - - 1 + - 810.047 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 2944 + - - 3 + - 3957.59 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 128 + - - 1 + - 2439.91 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 2368 + - - 3 + - 3796.22 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 4 + - - 7 + - 171.703 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1856 + - - 3 + - 4022.8 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 5056 + - - 2 + - 4356.06 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1408 + - - 0 + - 874.976 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1856 + - - 3 + - 3945.17 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1024 + - - 0 + - 658.675 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 128 + - - 1 + - 2668.23 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1856 + - - 1 + - 3343.48 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 768 + - 3584 + - - 1 + - 2936.54 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1856 + - - 3 + - 3835.13 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3584 + - - 3 + - 4468.64 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 2944 + - - 6 + - 100.161 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 768 + - 1024 + - - 1 + - 2994.03 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 3584 + - - 3 + - 3860.0 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + 
- 3328 + - 256 + - - 5 + - 166.319 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 4288 + - - 3 + - 4320.23 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 2944 + - - 3 + - 4247.47 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 2944 + - - 2 + - 4252.54 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 6784 + - - 3 + - 4377.01 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 64 + - - 5 + - 640.287 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 768 + - 2368 + - - 0 + - 2243.37 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 448 + - - 3 + - 3483.07 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 256 + - 4288 + - - 3 + - 2916.79 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 3584 + - - 3 + - 3779.32 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 64 + - - 5 + - 588.133 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 5888 + - - 3 + - 4328.28 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1408 + - - 0 + - 1898.88 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 5888 + - - 3 + - 3826.4 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 2944 + - - 3 + - 4227.63 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 5056 + - - 0 + - 2480.79 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 2944 + - - 2 + - 3975.22 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1856 + - - 4 + - 4057.56 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 768 + - 128 + - - 5 + - 519.375 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1024 + - - 2 + - 3962.33 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 64 + - - 1 + - 814.054 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 448 + - - 6 + - 19.4174 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1024 + - - 
1 + - 1988.33 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 5056 + - - 3 + - 4421.63 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 2944 + - - 3 + - 4185.69 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 704 + - - 1 + - 1143.07 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 6784 + - - 3 + - 3525.45 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 4 + - - 7 + - 147.386 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 768 + - 4 + - - 6 + - 5.32911 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 4288 + - - 3 + - 3757.16 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 6784 + - - 3 + - 4523.58 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 5056 + - - 3 + - 4171.11 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 128 + - - 1 + - 2254.56 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 2538.43 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 2368 + - - 3 + - 3912.09 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 256 + - - 5 + - 323.388 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 256 + - - 1 + - 3485.72 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 4288 + - - 3 + - 3929.0 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1408 + - - 1 + - 2787.95 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 128 + - - 0 + - 2244.3 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1024 + - - 0 + - 2396.86 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 2368 + - - 3 + - 3953.51 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1024 + - - 0 + - 2627.88 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 5056 + - - 3 + - 3717.74 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1856 + - - 1 + - 3142.24 + - - - 
5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 2368 + - - 3 + - 3933.76 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 2944 + - - 1 + - 2790.8 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1408 + - - 3 + - 3307.07 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1856 + - - 3 + - 4151.1 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 2368 + - - 2 + - 3584.62 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 256 + - 5888 + - - 1 + - 2124.12 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 768 + - 448 + - - 5 + - 262.929 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 2368 + - - 3 + - 4188.53 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 6784 + - - 6 + - 210.086 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 448 + - - 4 + - 2939.18 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 128 + - - 1 + - 3058.55 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 4288 + - - 3 + - 4275.42 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 4288 + - - 3 + - 3787.32 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 5888 + - - 3 + - 4190.97 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 64 + - - 0 + - 1458.48 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 2944 + - - 3 + - 4432.94 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 704 + - - 1 + - 2579.92 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 768 + - 128 + - - 5 + - 151.353 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 6784 + - - 3 + - 3863.1 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 4288 + - - 3 + - 4337.39 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 768 + - 5888 + - - 1 + - 2668.49 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 256 + - 2368 + - - 1 + - 1547.44 + - - - 2368 + - 2368 + - 1 + - 256 + - 
2368 + - 2368 + - 256 + - 2368 + - - 3 + - 3829.39 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 2368 + - - 2 + - 3727.92 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 5888 + - - 3 + - 4491.96 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1408 + - - 0 + - 1713.46 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 704 + - - 1 + - 2741.28 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 704 + - - 1 + - 3290.97 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 6784 + - - 3 + - 4281.9 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 256 + - 704 + - - 6 + - 20.9726 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 256 + - - 1 + - 3034.19 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 64 + - - 1 + - 2130.71 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1024 + - - 4 + - 3574.77 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 768 + - 64 + - - 5 + - 75.3625 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 704 + - - 1 + - 2115.46 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1024 + - - 3 + - 3061.58 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 5056 + - - 3 + - 3957.03 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 256 + - - 3 + - 3198.62 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 64 + - - 5 + - 454.192 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 256 + - 4 + - - 6 + - 4.40748 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 4 + - - 7 + - 153.371 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 128 + - - 0 + - 2554.01 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 768 + - 5056 + - - 6 + - 149.939 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 704 + - - 4 + - 3338.07 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 704 + - - 0 + - 906.525 + - - 
- 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1408 + - - 6 + - 50.5587 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 5888 + - - 3 + - 4391.69 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 448 + - - 1 + - 3469.17 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 256 + - 5056 + - - 3 + - 2998.05 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 256 + - 704 + - - 5 + - 326.05 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1408 + - - 3 + - 3846.83 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 6784 + - - 3 + - 3914.34 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 4288 + - - 3 + - 4135.85 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 256 + - 1408 + - - 6 + - 39.3504 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1024 + - - 0 + - 2563.4 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 2944 + - - 3 + - 4435.01 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 64 + - - 0 + - 1315.78 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 6784 + - - 3 + - 4473.26 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 768 + - 5888 + - - 3 + - 3890.44 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 1024 + - - 2 + - 3016.04 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 5056 + - - 3 + - 3962.72 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 128 + - - 5 + - 322.658 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 448 + - - 0 + - 1912.01 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 2368 + - - 3 + - 4017.84 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 5056 + - - 3 + - 3390.77 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 1024 + - - 4 + - 3703.29 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 120.785 + - - - 2368 + - 4288 + - 1 + - 256 
+ - 2368 + - 2368 + - 256 + - 4288 + - - 3 + - 3948.44 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 2368 + - - 1 + - 3792.34 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3584 + - - 2 + - 4387.38 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 5888 + - - 1 + - 3643.62 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 64 + - - 1 + - 3299.67 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 1856 + - - 3 + - 3588.19 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 5888 + - - 3 + - 4078.45 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 448 + - - 4 + - 3371.57 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 2944 + - - 3 + - 4360.64 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 4288 + - - 3 + - 4392.06 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1408 + - - 3 + - 4222.71 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 128 + - - 1 + - 2335.25 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 4 + - - 7 + - 69.5323 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 448 + - - 1 + - 2604.29 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 768 + - 1024 + - - 1 + - 1777.67 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 2368 + - - 3 + - 3944.55 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 2368 + - - 3 + - 3717.36 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 128 + - - 1 + - 2000.46 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3584 + - - 2 + - 4134.9 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 256 + - 704 + - - 1 + - 1607.26 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 128 + - - 0 + - 1794.73 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 4288 + - - 3 + - 3891.31 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 
4 + - 1792 + - 1024 + - - 6 + - 37.5085 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 5888 + - - 3 + - 4452.59 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1408 + - - 0 + - 1787.18 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 5888 + - - 3 + - 4399.47 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 2368 + - - 3 + - 4136.05 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 256 + - - 3 + - 3369.85 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 5888 + - - 1 + - 2940.16 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 2368 + - - 3 + - 4231.33 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 4288 + - - 3 + - 4028.84 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 5056 + - - 3 + - 4216.8 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 704 + - - 4 + - 3892.0 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 4 + - - 7 + - 38.3811 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1856 + - - 0 + - 1040.26 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 2944 + - - 1 + - 3366.31 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 128 + - - 1 + - 2145.79 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 4 + - - 7 + - 102.605 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 768 + - 128 + - - 1 + - 810.35 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 4 + - - 6 + - 18.9098 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 6784 + - - 3 + - 4352.76 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1024 + - - 2 + - 4065.99 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 4 + - - 7 + - 77.9339 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 3584 + - - 3 + - 4095.15 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1408 + - - 1 + - 
622.088 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 2368 + - - 0 + - 2457.6 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1408 + - - 1 + - 2750.56 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 256 + - - 1 + - 2935.6 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1408 + - - 3 + - 3960.42 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4288 + - - 1 + - 2239.41 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 2944 + - - 1 + - 3643.5 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1856 + - - 1 + - 3158.62 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 768 + - 2368 + - - 6 + - 79.264 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 5888 + - - 3 + - 4031.4 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 4 + - - 6 + - 130.742 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 256 + - 448 + - - 5 + - 409.783 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 4288 + - - 3 + - 4343.32 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 6784 + - - 3 + - 4176.74 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 2944 + - - 1 + - 2866.03 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 1408 + - - 3 + - 3994.72 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 5056 + - - 0 + - 2027.3 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1024 + - - 0 + - 1307.58 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5888 + - - 3 + - 2800.1 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1408 + - - 3 + - 4045.44 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 5056 + - - 3 + - 4350.88 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 256 + - 2368 + - - 6 + - 66.1994 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 5888 + - - 3 + - 4429.75 + - - - 448 + - 704 + - 1 + - 
1792 + - 448 + - 448 + - 1792 + - 704 + - - 1 + - 2347.83 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 4 + - - 7 + - 122.606 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 128 + - - 1 + - 3461.28 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1408 + - - 3 + - 3862.9 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 6784 + - - 3 + - 4314.95 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 1 + - 1820.64 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5056 + - - 1 + - 2554.51 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 256 + - 128 + - - 5 + - 121.72 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 128 + - - 1 + - 2526.01 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1856 + - - 3 + - 3500.14 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 768 + - 2944 + - - 6 + - 94.8458 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 1024 + - - 6 + - 36.9641 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 5888 + - - 3 + - 4039.62 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1024 + - - 2 + - 3926.58 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 448 + - - 1 + - 3360.46 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 448 + - - 1 + - 3478.69 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 5056 + - - 3 + - 4168.09 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1408 + - - 0 + - 2497.16 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1024 + - - 1 + - 1348.94 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1024 + - - 0 + - 1267.05 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 256 + - 2944 + - - 1 + - 1897.6 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 256 + - - 3 + - 3324.55 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 128 + - 
- 1 + - 1431.49 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 256 + - 64 + - - 5 + - 209.508 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1024 + - - 2 + - 3402.08 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 4288 + - - 3 + - 4204.7 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 704 + - - 1 + - 3430.74 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 4288 + - - 3 + - 4275.31 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 256 + - - 0 + - 2715.65 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 4288 + - - 1 + - 2118.98 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 768 + - 3584 + - - 1 + - 3201.68 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1024 + - - 4 + - 3678.2 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 704 + - - 1 + - 2198.16 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 768 + - 704 + - - 1 + - 2032.08 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 5056 + - - 6 + - 167.361 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 3584 + - - 3 + - 4009.87 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 3584 + - - 3 + - 3550.13 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 4 + - - 6 + - 93.1657 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 64 + - - 1 + - 625.778 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 768 + - 256 + - - 5 + - 150.85 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 768 + - 6784 + - - 1 + - 2876.53 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 128 + - - 0 + - 2172.08 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 5888 + - - 3 + - 4365.81 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 704 + - - 1 + - 3414.8 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 5056 + - - 3 + - 4415.58 + - - - 3584 + - 256 + - 1 
+ - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 1 + - 2364.45 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 2368 + - - 1 + - 2334.79 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1856 + - - 3 + - 3915.17 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 5 + - 121.476 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1856 + - - 3 + - 3821.16 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 4 + - - 7 + - 110.438 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 256 + - 448 + - - 6 + - 14.6836 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 768 + - 5056 + - - 0 + - 2318.79 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 2368 + - - 3 + - 4253.26 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1408 + - - 3 + - 3893.27 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 704 + - - 2 + - 3972.1 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 3584 + - - 3 + - 4183.15 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 1408 + - - 3 + - 3374.27 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 1024 + - - 3 + - 3582.47 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 256 + - 1024 + - - 6 + - 28.1635 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1856 + - - 2 + - 3685.44 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 768 + - 2944 + - - 1 + - 2521.2 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 64 + - - 5 + - 457.361 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 2944 + - - 1 + - 3446.67 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 704 + - - 3 + - 3157.7 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 2368 + - - 3 + - 3922.4 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 448 + - - 3 + - 3285.84 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 448 + - 
- 0 + - 2552.36 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 256 + - 448 + - - 1 + - 1607.61 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 2368 + - - 3 + - 3584.07 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 4 + - - 6 + - 112.526 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 256 + - - 3 + - 2789.89 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 128 + - - 5 + - 241.237 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1024 + - - 3 + - 4244.32 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1408 + - - 3 + - 3673.84 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 704 + - - 1 + - 3131.21 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 4288 + - - 3 + - 4299.61 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 4 + - - 6 + - 54.0926 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1408 + - - 3 + - 4009.11 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 256 + - 2368 + - - 1 + - 995.008 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 256 + - 2944 + - - 6 + - 82.0988 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 6784 + - - 3 + - 4500.49 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1408 + - - 3 + - 2733.34 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 2368 + - - 3 + - 4265.14 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 1 + - 785.758 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1024 + - - 2 + - 4140.24 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 5888 + - - 3 + - 4052.4 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 6784 + - - 3 + - 4216.63 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 5056 + - - 1 + - 3308.61 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 4 + - - 7 + - 65.9487 + - - - 4 + - 256 + - 1 + 
- 768 + - 4 + - 4 + - 768 + - 256 + - - 6 + - 10.6099 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 4 + - - 6 + - 0.175665 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 6784 + - - 3 + - 4508.17 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 448 + - - 4 + - 3847.66 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3584 + - - 1 + - 3566.32 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 256 + - - 1 + - 2856.33 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 768 + - 5056 + - - 2 + - 3796.24 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 6784 + - - 3 + - 4471.32 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 3584 + - - 3 + - 3822.56 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 4288 + - - 3 + - 3517.63 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 256 + - 4 + - - 6 + - 14.8355 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 5888 + - - 3 + - 4233.28 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 6784 + - - 3 + - 4521.13 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 4288 + - - 1 + - 2150.33 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 4288 + - - 1 + - 2825.53 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3584 + - - 3 + - 4209.29 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 2944 + - - 3 + - 4400.3 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 3584 + - - 3 + - 4403.99 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1408 + - - 3 + - 3640.71 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 768 + - 4 + - - 6 + - 10.6451 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 6784 + - - 1 + - 3379.92 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 128 + - - 0 + - 1265.85 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 4 + - 
- 6 + - 28.0971 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 2368 + - - 3 + - 4151.86 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 4 + - - 7 + - 88.5794 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1856 + - - 3 + - 4097.83 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1856 + - - 1 + - 2585.67 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 5056 + - - 3 + - 3928.11 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 5056 + - - 1 + - 3569.57 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 704 + - - 3 + - 2734.12 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1856 + - - 3 + - 4173.45 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 704 + - - 1 + - 3141.82 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 1856 + - - 1 + - 3241.0 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 64 + - - 1 + - 992.157 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 256 + - 5888 + - - 1 + - 1851.0 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 256 + - 2944 + - - 1 + - 1177.91 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 64 + - - 0 + - 1901.56 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 6784 + - - 2 + - 3392.09 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1024 + - - 2 + - 3503.26 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 128 + - - 5 + - 81.121 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 128 + - - 1 + - 1543.66 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 5056 + - - 3 + - 4296.26 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 448 + - - 1 + - 3362.71 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1408 + - - 3 + - 4292.51 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1024 + - - 4 + - 3596.07 + - - - 1856 + - 
3584 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 3584 + - - 3 + - 3841.89 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 768 + - 64 + - - 5 + - 411.106 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 768 + - 1856 + - - 1 + - 1928.73 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 2944 + - - 3 + - 3909.92 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 256 + - - 0 + - 2398.7 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 5056 + - - 3 + - 4365.58 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 128 + - - 5 + - 332.335 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 2368 + - - 3 + - 3861.85 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 768 + - 3584 + - - 0 + - 1809.28 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 256 + - 5056 + - - 3 + - 3416.57 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 256 + - 6784 + - - 3 + - 3932.03 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1856 + - - 3 + - 4231.93 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 256 + - 128 + - - 5 + - 409.052 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1856 + - - 3 + - 4117.65 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 256 + - - 1 + - 3617.52 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 768 + - 1856 + - - 1 + - 3144.43 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 768 + - 448 + - - 6 + - 18.1636 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 4288 + - - 3 + - 4207.4 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 1 + - 1145.19 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 256 + - - 1 + - 2422.28 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 1856 + - - 3 + - 4044.97 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 6784 + - - 3 + - 4384.84 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 
1792 + - 704 + - - 0 + - 2803.55 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 4288 + - - 1 + - 3677.55 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 4 + - - 6 + - 39.5061 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 5888 + - - 2 + - 4163.12 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 704 + - - 3 + - 3482.29 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 768 + - 6784 + - - 6 + - 193.206 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 256 + - - 1 + - 3395.77 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1408 + - - 0 + - 800.749 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 448 + - - 1 + - 3295.06 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 128 + - - 6 + - 5.72624 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 256 + - - 1 + - 643.054 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1024 + - - 4 + - 3307.55 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1856 + - - 3 + - 3282.0 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 2368 + - - 3 + - 4270.52 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1408 + - - 1 + - 2767.25 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 256 + - 2944 + - - 1 + - 2606.98 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 256 + - 5888 + - - 3 + - 3446.58 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 4 + - - 6 + - 39.9493 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4 + - - 6 + - 8.77248 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1024 + - - 4 + - 3119.75 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 5056 + - - 2 + - 4032.02 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 64 + - - 1 + - 39.961 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 2944 + - - 3 + - 4238.23 + - - - 4288 + - 256 + - 1 + - 
3328 + - 4288 + - 4288 + - 3328 + - 256 + - - 0 + - 2775.93 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 704 + - - 1 + - 2149.6 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 256 + - 448 + - - 5 + - 210.534 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 5888 + - - 3 + - 4055.65 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 128 + - - 1 + - 873.935 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 64 + - - 1 + - 2872.57 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 6784 + - - 3 + - 4483.32 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 2944 + - - 3 + - 4168.08 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 256 + - 128 + - - 1 + - 626.594 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 448 + - - 1 + - 3491.63 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 128 + - - 1 + - 1556.73 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 1 + - 2299.97 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 64 + - - 0 + - 876.647 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 64 + - - 5 + - 162.065 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1408 + - - 2 + - 3741.83 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 4 + - - 7 + - 67.6235 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1024 + - - 4 + - 3501.02 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 768 + - 6784 + - - 1 + - 3267.87 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 2944 + - - 3 + - 4145.54 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 5888 + - - 3 + - 3691.65 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 5888 + - - 3 + - 4174.5 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 256 + - - 0 + - 661.359 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 768 
+ - 1024 + - - 4 + - 3596.78 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2368 + - - 0 + - 1826.5 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 704 + - - 3 + - 3672.47 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 64 + - - 0 + - 657.616 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 2368 + - - 3 + - 4333.14 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 128 + - - 0 + - 1934.13 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 256 + - - 1 + - 3146.6 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 4288 + - - 3 + - 3830.79 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 64 + - - 1 + - 2395.97 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 4288 + - - 3 + - 3796.72 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 1024 + - - 1 + - 3366.99 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 5056 + - - 0 + - 2579.78 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 1408 + - - 6 + - 51.6518 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 4288 + - - 3 + - 4303.75 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 64 + - - 1 + - 83.2651 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 256 + - - 6 + - 11.3623 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1408 + - - 3 + - 3555.33 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 4 + - - 7 + - 53.5578 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 4288 + - - 1 + - 3437.27 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 704 + - - 4 + - 3809.03 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 4288 + - - 3 + - 4090.86 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1024 + - - 5 + - 589.015 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 2944 + - - 3 + - 4349.15 + - - - 
704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3584 + - - 1 + - 3384.32 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 448 + - - 0 + - 2488.74 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 2368 + - - 0 + - 2397.18 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 448 + - - 1 + - 2344.82 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 2944 + - - 0 + - 1780.56 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 2944 + - - 3 + - 4267.95 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 3584 + - - 3 + - 4227.78 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 768 + - 5888 + - - 3 + - 3191.33 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 256 + - - 0 + - 1723.41 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3584 + - - 3 + - 4307.98 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1024 + - - 3 + - 3294.33 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 5888 + - - 3 + - 4126.79 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 448 + - - 1 + - 2346.21 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 768 + - 256 + - - 1 + - 1557.66 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 704 + - - 1 + - 2782.66 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 4 + - - 6 + - 53.2666 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 2368 + - - 3 + - 3829.36 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1408 + - - 1 + - 3651.59 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1024 + - - 1 + - 3223.15 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 2368 + - - 2 + - 3969.34 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1856 + - - 3 + - 3811.57 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 256 + - 448 + - - 1 + - 1241.79 + - - - 5056 + - 448 + - 1 + - 
768 + - 5056 + - 5056 + - 768 + - 448 + - - 1 + - 3315.74 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 256 + - 128 + - - 5 + - 60.2908 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 2368 + - - 3 + - 4255.72 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 448 + - - 1 + - 789.93 +- null diff --git a/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml b/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml new file mode 100644 index 000000000..1c28a5782 --- /dev/null +++ b/HostLibraryTests/configs/lite_configs/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml @@ -0,0 +1,12161 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + 
BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + 
PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + 
AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 64 + LVCA: 8 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 
+ PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + 
AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + 
PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + 
AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + 
NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + 
_staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + 
NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + 
WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 32 + LVCA: 4 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + 
NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x32x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 
+ Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + 
NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + 
ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + 
MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 
+ ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + 
MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 8 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + 
- 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 6 + - 2954.59 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 4 + - 4025.85 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 116.076 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 1 + - 845.171 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 1972.31 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 5 + - 2480.72 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 59.9816 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4257.57 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 3 + - 3289.8 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3303.91 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 5 + - 1484.0 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 3705.47 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 1238.89 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 5 + - 2209.44 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 3 + - 4001.8 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 7 + - 13.0749 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 4 + - 3907.7 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 74.4445 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 3 + - 4282.36 + - - - 
3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 8 + - 120.803 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 4 + - 3782.03 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 2976.19 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3847.68 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 4112.42 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 6 + - 3046.15 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 2 + - 449.449 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 62.3904 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 7 + - 3.39824 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 6 + - 2200.75 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 3516.69 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4032.95 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 0 + - 3915.86 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 3413.62 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 5 + - 2585.53 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 5 + - 2676.32 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 6 + - 2610.68 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 5 + - 2760.48 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 7 + - 104.231 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 47.383 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 4 + - 3924.37 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 1289.67 + - - - 1408 + - 5056 + - 1 + 
- 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 3 + - 4057.1 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 3 + - 3225.34 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 0 + - 3503.28 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 4 + - 3301.1 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 0 + - 3759.95 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 4 + - 3445.79 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 4 + - 3442.49 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 6 + - 2882.31 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 4 + - 3759.15 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 2018.01 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 8 + - 219.812 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 0 + - 3566.71 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 3912.43 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 6 + - 2935.45 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 0 + - 3457.56 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 1594.49 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 5 + - 2992.89 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 0 + - 3768.5 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 197.778 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 5 + - 2634.93 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 3 + - 3751.81 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 5 + - 2059.72 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + 
- 3328 + - 3328 + - - 3 + - 4168.66 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 4 + - 3866.16 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 2 + - 153.45 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 3 + - 4119.58 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 3268.41 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 5 + - 1929.12 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 4 + - 3553.24 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 6 + - 2971.75 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 0 + - 3894.12 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 6 + - 2896.24 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 5 + - 1313.5 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 5 + - 1682.69 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 1 + - 1860.07 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 2829.95 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 7 + - 85.9574 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 5 + - 1724.63 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 4 + - 3608.87 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 2951.84 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 4 + - 3544.32 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 0 + - 3394.21 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 6 + - 2647.22 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 5 + - 2117.2 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 
3077.93 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 0 + - 3537.99 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 2.47794 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 3350.62 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 6 + - 2769.06 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 2611.65 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 0 + - 3931.4 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 0 + - 3628.16 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 3.34032 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 1656.91 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 1 + - 2845.71 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 45.7854 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 0 + - 3748.16 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4145.64 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 5 + - 1867.3 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 0 + - 3791.39 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 2 + - 504.215 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 3949.4 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 4 + - 3507.09 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 0.189148 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 0 + - 3491.21 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 3 + - 3243.14 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 3055.67 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 
5056 + - 1792 + - 1792 + - - 3 + - 3974.1 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 6 + - 2313.73 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 2892.91 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 0 + - 3394.58 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 6 + - 3161.19 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 94.5694 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 4 + - 3700.44 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 7 + - 47.3194 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 3 + - 4032.43 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 614.494 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 4 + - 3945.16 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 4 + - 3369.2 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 3002.56 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 2 + - 199.873 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 4 + - 3803.42 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 2333.84 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 3 + - 4137.48 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 3 + - 3794.16 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 137.801 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 3308.23 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 3306.04 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 2 + - 379.582 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 47.0106 + - - 
- 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 0 + - 3572.96 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 5 + - 1920.96 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3979.16 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 4245.44 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 4 + - 3591.76 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3685.82 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 3 + - 4128.27 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 3899.64 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 185.705 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 1 + - 1542.23 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 2016.49 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 6 + - 3361.14 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 5 + - 1730.08 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 3 + - 3968.13 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 2 + - 1539.55 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 3928.83 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 5 + - 1477.08 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 4 + - 3802.97 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 3 + - 4251.2 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 7 + - 3.29931 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3234.49 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 399.61 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 
+ - 704 + - 3328 + - 3328 + - - 5 + - 3310.51 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 1 + - 1127.07 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 1229.4 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 5 + - 2483.92 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 4 + - 3449.25 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 44.6838 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 3 + - 3532.17 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 0 + - 3602.91 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 2 + - 557.951 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 2082.54 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 5 + - 2898.46 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3850.44 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 7 + - 56.5909 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 3 + - 3687.44 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 4 + - 3784.63 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 2202.49 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 3 + - 3929.59 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 6 + - 2959.0 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 2 + - 1213.31 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 3777.43 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 0 + - 3763.48 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 6 + - 3171.29 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 
5 + - 1415.27 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 4 + - 4063.84 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 1867.92 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 4 + - 2891.71 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 4202.4 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 2 + - 225.483 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 5 + - 1394.04 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 0 + - 3333.63 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 2 + - 258.161 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 3 + - 3878.62 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 0 + - 3495.89 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 3 + - 3232.17 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 1211.2 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 5 + - 1864.66 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 889.455 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 2540.22 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 2 + - 1213.26 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 3 + - 3415.1 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 1 + - 1897.22 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 3978.16 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 3 + - 3401.08 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 3 + - 3971.91 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 3864.17 + - - - 
448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 2 + - 1451.96 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 6 + - 2650.71 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 2 + - 99.9024 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 536.026 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 3109.53 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 6 + - 3308.31 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 5 + - 1632.02 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 3 + - 3452.57 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3642.52 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 2 + - 676.958 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 0 + - 3733.15 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 7 + - 42.4366 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 2 + - 1259.44 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 0 + - 3578.36 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 7 + - 22.8941 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 0 + - 3558.79 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3002.15 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 2917.45 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 8 + - 76.6595 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 2 + - 716.596 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 2 + - 434.321 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 23.5363 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + 
- - 3 + - 3388.29 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 4134.75 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 4 + - 3280.21 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 6 + - 2935.68 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 7 + - 66.36 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 1157.14 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 7 + - 6.74141 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 1 + - 2026.28 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 1 + - 2568.07 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 4 + - 3872.69 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 126.041 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 4074.29 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3320.38 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 0 + - 3955.26 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 2444.39 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 2966.8 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 860.967 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4177.86 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 6 + - 2883.97 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 5 + - 2109.4 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 1 + - 2356.82 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 7 + - 158.154 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 5 + - 3018.65 + - - 
- 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 2 + - 345.417 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 2 + - 1022.14 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 880.153 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 2 + - 1605.97 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 0 + - 3659.17 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 7 + - 13.429 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 5 + - 2351.72 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 3985.1 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 5 + - 1868.76 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 3240.85 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4121.05 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 4 + - 3714.4 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 64.5789 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 2793.34 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 4 + - 3457.72 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 0 + - 3307.29 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 2 + - 854.784 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 3 + - 3676.24 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 2059.89 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 5 + - 2163.63 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 6 + - 3219.27 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 5 + - 2405.82 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + 
- 1024 + - 3328 + - 3328 + - - 0 + - 3520.4 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 2 + - 679.353 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 0 + - 3815.12 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 0 + - 4022.07 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 108.933 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 1 + - 1140.96 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 7 + - 4.88687 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 3 + - 3431.58 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3291.2 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 6 + - 3216.38 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 4 + - 3500.9 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 0 + - 3963.31 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 1937.87 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 2 + - 884.522 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 1 + - 2568.63 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 0 + - 3523.17 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 4 + - 3557.97 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 4 + - 3019.04 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 6.25454 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 5 + - 2023.96 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 2081.99 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 53.8336 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + 
- 1459.06 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4235.25 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 5 + - 1552.34 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 1754.44 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 3832.67 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 5 + - 2774.48 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 2506.29 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3983.94 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 6 + - 2049.01 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 12.4363 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 0 + - 4035.24 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 8 + - 112.578 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 0 + - 3777.6 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 2 + - 615.139 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 5 + - 1469.36 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 3 + - 4162.26 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 4 + - 3807.08 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 150.802 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3953.73 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 2656.61 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 7 + - 43.1504 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 0 + - 3456.13 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 1330.25 + - - - 1856 + - 2944 + - 1 + - 
256 + - 1856 + - 1856 + - 256 + - 256 + - - 4 + - 3533.04 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 0 + - 3989.01 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 4 + - 3759.93 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 0 + - 3955.47 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 3260.15 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 5 + - 2931.91 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 3314.05 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 6 + - 1663.64 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 0 + - 3366.61 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 0 + - 3901.83 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 3825.48 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 2 + - 300.222 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 0 + - 3463.15 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 4 + - 3917.56 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 0 + - 2894.32 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 5 + - 2950.38 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 72.7336 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 4171.16 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 2471.0 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 0 + - 3945.03 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 0 + - 3515.58 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 4 + - 3370.12 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 
3328 + - 3328 + - - 3 + - 3434.27 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3858.55 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 2561.33 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 5 + - 2379.07 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 5 + - 2854.89 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 7 + - 93.9893 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 0 + - 3518.31 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 7 + - 60.5684 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 3884.63 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 4324.6 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 7 + - 31.2047 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 1674.28 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 2 + - 1016.78 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 1599.11 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 0 + - 3444.48 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 3 + - 4132.45 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 2 + - 1257.43 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 3 + - 3214.23 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 56.7984 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 3077.58 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 6 + - 2772.91 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 5 + - 2591.06 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 2 + - 536.558 + - - - 6784 + 
- 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 4 + - 3915.26 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 3.41876 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3252.95 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 3888.51 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 4 + - 3946.23 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 5 + - 2524.57 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 7 + - 2.48897 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 4 + - 3734.78 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 1 + - 3040.71 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 3 + - 4119.12 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 3 + - 4012.64 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 4151.1 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 753.022 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 4025.26 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 710.826 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 3292.4 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 1494.64 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 2649.35 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 0 + - 3389.44 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4259.43 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 1960.4 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 108.675 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + 
- 1792 + - 1792 + - - 2 + - 1154.88 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 5 + - 1281.64 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 6 + - 2264.13 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 4108.75 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 0 + - 3627.7 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3763.17 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 7 + - 72.78 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 3114.58 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 3923.11 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 2880.72 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 6 + - 2684.96 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 1108.79 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 3 + - 3036.86 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 3979.84 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 5 + - 2082.23 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 0 + - 3280.2 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 6.60929 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 4024.75 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 3940.16 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3272.78 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 4026.52 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 1015.51 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 5 + 
- 3003.32 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 5 + - 2609.94 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3803.62 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 3 + - 3782.58 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 2308.14 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 2907.82 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4216.97 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4040.01 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 4 + - 3322.98 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3207.4 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 7 + - 99.1004 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 0.205247 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 3 + - 3970.49 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 7 + - 76.7561 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 1382.88 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 0 + - 3785.46 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 2 + - 593.586 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 7 + - 82.4428 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 4014.26 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 0.147297 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 4 + - 3732.83 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 1 + - 1710.7 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 3 + - 3960.69 + - - - 1408 + - 
6784 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3955.15 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 2241.05 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 6 + - 3275.56 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 9.95386 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 2 + - 717.905 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 5 + - 1217.5 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 4 + - 3939.37 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 5 + - 2765.1 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 3160.15 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 3 + - 4037.76 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 2933.2 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 5 + - 1211.49 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 21.8833 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 6 + - 2966.72 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 2912.42 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 6 + - 2914.8 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 5 + - 1995.58 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 108.24 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 5 + - 2322.55 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 217.221 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 5 + - 1619.33 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 4 + - 3894.97 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 
768 + - - 0 + - 3867.84 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 3 + - 4084.35 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 1488.61 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 2116.81 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3882.16 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 2980.45 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 7 + - 138.205 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 7 + - 6.1811 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 0 + - 3256.35 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 2 + - 500.457 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 5 + - 2214.22 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 140.466 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 4 + - 3451.74 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 3180.68 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 2723.57 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 4 + - 3434.31 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 3 + - 3961.62 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 1 + - 1516.34 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 2204.84 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 31.6601 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 7 + - 103.546 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 4 + - 3802.0 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 4 + - 3844.41 + - - - 704 + - 1408 + - 1 
+ - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 2508.24 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 4091.78 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 1 + - 1108.79 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 1 + - 2097.85 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 0 + - 3608.38 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3494.14 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 7 + - 65.54 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 0 + - 3767.59 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 5 + - 1153.71 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 0 + - 3941.89 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 4 + - 3756.48 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 3 + - 3591.21 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 2444.08 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 3 + - 3223.06 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 0 + - 3734.12 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 3 + - 4139.0 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 8 + - 86.4303 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 2 + - 1945.87 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 3 + - 3928.89 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 3 + - 3418.02 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 16.6311 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 4170.31 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + 
- - 6 + - 3048.08 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 4 + - 3134.49 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 2069.02 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 5 + - 952.035 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 1 + - 1578.36 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 0 + - 3645.8 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 5 + - 1495.33 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 1 + - 1764.85 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 3 + - 3366.48 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 8 + - 80.1206 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 2055.88 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 0 + - 3834.83 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 4 + - 4011.32 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 149.863 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 0 + - 3404.19 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 3 + - 4109.44 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 6 + - 2498.26 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 6.70746 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 69.7989 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 3 + - 4248.83 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 2 + - 1674.96 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 6 + - 2646.07 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 4150.71 + - - - 1408 + - 2368 + 
- 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 3 + - 3731.23 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 3 + - 3713.5 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 4 + - 3691.7 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 2 + - 1532.18 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 162.997 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 4 + - 3803.42 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 4025.75 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 1 + - 2439.4 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 8 + - 114.954 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4252.25 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3862.28 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 3102.19 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 3214.28 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4055.76 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 3804.86 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 3 + - 3857.54 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 3 + - 3810.17 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 4 + - 3294.59 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 3 + - 4213.43 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 3 + - 4151.42 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 104.221 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 2 + - 782.339 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 
64 + - 3328 + - 3328 + - - 1 + - 2243.95 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 4 + - 3843.13 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 3896.45 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 34.9587 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 0 + - 3504.68 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 3 + - 4358.78 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 1295.8 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 3 + - 3553.18 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 3 + - 3844.99 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 3 + - 3526.8 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 7 + - 22.457 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 2623.53 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 7 + - 3.08332 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4016.52 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 112.535 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 0 + - 3777.84 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 5 + - 1905.07 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3698.4 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 43.2817 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 5 + - 2132.15 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 0 + - 3322.72 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 3 + - 3990.69 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 6 + - 3470.39 + - - - 
448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 4 + - 3336.99 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 262.494 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 4 + - 3524.82 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 7 + - 20.8929 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 0 + - 3273.35 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 2290.86 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 4026.55 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 853.492 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 564.864 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 4 + - 3504.03 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 1937.26 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 3 + - 4169.33 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 6 + - 2191.68 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3757.99 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 6 + - 2608.83 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 6 + - 3197.71 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 1722.02 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 7 + - 125.372 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3619.11 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 7 + - 114.523 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 3 + - 4077.13 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 0 + - 3385.18 + - - - 704 + - 704 + - 1 + - 768 + - 704 + 
- 704 + - 768 + - 768 + - - 5 + - 1869.17 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 4 + - 3291.09 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 5 + - 1756.0 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 3812.85 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 2214.76 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 6 + - 2976.54 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 5 + - 2481.64 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 6 + - 3343.25 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 6 + - 2830.61 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 5 + - 1100.29 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 7 + - 65.1619 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 0 + - 3104.21 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 2018.85 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 2060.07 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 1560.44 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 3 + - 3902.03 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3309.7 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 558.545 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 0 + - 3829.35 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 0 + - 3777.6 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 1 + - 3223.43 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 2858.71 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 
133.193 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 3 + - 4031.67 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 2 + - 891.821 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 6 + - 2437.19 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 3.13365 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 6 + - 2900.65 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 1406.75 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 4 + - 3738.0 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 3304.99 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 215.765 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 4 + - 3898.43 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 2 + - 768.813 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 3 + - 3892.4 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 66.1967 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 1 + - 2563.12 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 3 + - 3963.2 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 4 + - 3863.82 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 1606.41 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 23.0616 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 5 + - 2049.52 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 7 + - 127.111 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3502.73 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 5 + - 2732.77 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 
1024 + - 3328 + - 3328 + - - 5 + - 3000.67 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4122.05 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 5 + - 1994.21 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 3 + - 3866.88 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 1665.22 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 3366.98 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 4 + - 3597.57 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 6 + - 2658.23 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 1067.89 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 2512.74 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 1943.57 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 3 + - 3528.29 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 0 + - 3564.84 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 7 + - 21.8379 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 7 + - 158.333 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 1924.3 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 4351.33 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 1 + - 2424.08 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 7 + - 138.197 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 0 + - 3343.06 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 299.593 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 2646.56 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 3131.85 
+ - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 7 + - 206.195 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 6 + - 2613.54 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 3 + - 4401.65 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 3733.95 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 3287.15 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 0 + - 3815.37 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 4 + - 3909.32 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 3 + - 3793.79 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 0 + - 3543.9 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 0 + - 3980.55 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 1 + - 2512.58 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 3052.26 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 6 + - 2708.82 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 2908.72 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 1737.12 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 2 + - 766.876 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 4 + - 3299.07 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 4032.77 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4067.76 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 6 + - 3466.62 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 2170.99 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 1386.94 + - - - 5056 + - 1024 + - 1 
+ - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 4 + - 3608.02 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 0 + - 3606.13 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 5 + - 1467.93 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 3 + - 4059.27 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 1 + - 2296.74 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 4 + - 3785.39 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 0 + - 3701.49 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 3977.24 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 2379.08 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4102.61 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 2341.32 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 5 + - 2450.42 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 0 + - 3443.87 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 8 + - 66.1168 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 2727.52 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 3 + - 4370.81 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 4 + - 3797.12 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 378.866 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 2701.07 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 6 + - 3351.04 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 2 + - 449.32 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 3 + - 4395.29 + - - - 2368 + - 2944 + - 1 + - 1792 + - 
2368 + - 2368 + - 1792 + - 1792 + - - 3 + - 3937.21 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 13.4054 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 5 + - 1791.16 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 8 + - 65.9035 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 6 + - 3172.76 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 2684.04 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 0 + - 3900.43 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 2857.86 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 4 + - 3631.34 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 1687.36 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 3783.43 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 2 + - 713.288 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 2 + - 225.314 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 6 + - 3141.68 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 3001.0 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 0 + - 3973.4 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 2 + - 74.3601 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3431.86 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 101.132 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 3 + - 3963.75 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 6 + - 3357.32 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 5 + - 2515.24 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 4 + - 
3871.99 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 3737.94 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 5 + - 1729.74 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 3 + - 4300.2 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 3 + - 3844.76 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 7 + - 29.848 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 3325.97 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 0 + - 3760.19 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 4 + - 3198.2 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 5 + - 1146.84 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 13.1003 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 5 + - 2202.94 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 4 + - 3004.89 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 0 + - 3112.16 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 31.887 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 0 + - 3788.3 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 7 + - 182.016 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 0 + - 3758.34 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 4 + - 3605.79 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 2197.54 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 392.337 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 0 + - 3137.03 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 84.8213 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 
+ - 768 + - 768 + - - 0 + - 3877.88 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 2484.13 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 5 + - 2510.52 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 3 + - 4100.18 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 5 + - 1807.42 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 3005.78 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 32.6355 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 6 + - 3173.73 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 2437.49 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 2934.74 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 1967.37 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 0 + - 3635.13 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 5 + - 2403.67 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 2 + - 890.209 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 6 + - 2648.92 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 2139.22 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 3 + - 3735.88 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3943.16 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 6 + - 2871.9 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 1837.92 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 4 + - 3908.47 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 2 + - 1212.11 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 5.09562 
+ - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 3 + - 3905.33 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 5 + - 1175.61 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 2 + - 395.457 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 6 + - 3153.54 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 5 + - 2408.47 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 4 + - 2887.5 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3775.55 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 3 + - 3838.62 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 1152.56 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 5 + - 1333.26 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 2 + - 1584.84 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3515.84 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 3800.37 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 1946.66 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 6 + - 2884.28 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 6 + - 2503.69 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 4 + - 3457.54 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 1549.72 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 2738.42 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 0 + - 3913.15 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 1758.9 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 1140.69 + - - - 448 + - 4 + - 1 + - 
256 + - 448 + - 448 + - 256 + - 256 + - - 7 + - 16.0478 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 6 + - 1920.85 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 149.696 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 2750.63 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 1481.63 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 6 + - 1495.86 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 5 + - 2324.93 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 4021.58 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 55.7085 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 6 + - 2659.91 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 2 + - 401.315 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 5 + - 2900.11 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 2605.0 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 7 + - 32.5243 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4132.5 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 34.1077 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 4 + - 3840.55 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 2926.91 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 90.5271 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 6 + - 3455.76 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 4 + - 3949.71 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 2 + - 1156.91 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3137.52 + - - - 256 + 
- 64 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 2 + - 198.828 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 4 + - 3739.9 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4019.39 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 0 + - 3725.79 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 4 + - 3824.97 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 434.27 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 5 + - 1989.69 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 1698.88 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 3 + - 3780.08 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 4 + - 3444.79 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 7 + - 90.2377 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 223.971 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 3015.48 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 3 + - 3835.43 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 0 + - 2890.97 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 3940.37 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 6 + - 3004.32 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3877.45 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 4027.68 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 6 + - 3226.99 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4362.06 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 1297.0 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 
+ - 256 + - 256 + - - 2 + - 153.36 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 0 + - 3910.82 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 1 + - 1888.46 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 5 + - 2150.46 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 6 + - 3355.82 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4149.16 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 6 + - 2999.52 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 7 + - 9.73118 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 2744.47 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3498.06 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 2269.99 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 2 + - 396.054 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 7 + - 109.453 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 4034.28 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 7 + - 67.9596 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 2895.62 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 5 + - 1551.01 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 1498.35 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 2914.21 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 109.235 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 3 + - 4358.17 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 3119.82 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 5 + - 
1657.55 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 3 + - 3256.66 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 3112.91 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 7 + - 33.9483 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 2 + - 112.704 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 66.5315 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 5 + - 3052.22 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 76.2308 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 1 + - 2663.87 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 1 + - 2933.66 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 6 + - 3280.2 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 4052.64 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 2 + - 852.963 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 4082.68 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 0 + - 3564.95 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 2 + - 855.481 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 4008.36 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 0 + - 3838.1 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 3 + - 4247.41 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 4 + - 3273.85 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 4387.22 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 3802.95 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 4 + - 3517.16 + - - - 1856 + - 1408 + - 1 
+ - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 4 + - 3263.1 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 5 + - 2467.98 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3331.87 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 4129.55 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 6 + - 2519.79 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 3041.59 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 4 + - 3148.94 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 4001.27 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 5 + - 2888.31 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 65.2708 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3844.53 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 7 + - 176.16 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 5 + - 1420.67 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 2731.74 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 2697.6 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 7 + - 139.557 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 4 + - 2932.99 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 5 + - 2671.15 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 3 + - 3951.69 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 7 + - 62.5511 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 6 + - 2730.59 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 3 + - 4053.56 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 3328 + 
- 3328 + - - 1 + - 2149.69 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 0 + - 3943.73 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 855.631 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 3 + - 3804.87 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 5 + - 1552.23 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 0 + - 3382.74 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 4 + - 3561.34 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 1 + - 2677.42 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 5 + - 2569.11 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 4 + - 3851.13 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 0 + - 3288.72 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 3 + - 3359.9 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 7 + - 6.58145 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 4 + - 3759.49 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 1792.92 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 6 + - 3177.83 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3495.41 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 2071.18 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 5 + - 3013.89 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3872.27 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 6 + - 2979.62 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 3060.39 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - 
- 4 + - 3908.24 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 3381.96 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 5 + - 2025.58 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 0 + - 3276.42 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 5 + - 1673.68 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 8 + - 71.5333 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 0.211818 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 2 + - 217.986 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 5 + - 2125.93 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 2 + - 1299.37 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 1791.09 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 1 + - 1112.35 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3826.11 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 2129.68 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 7 + - 127.058 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 4074.23 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 1 + - 2861.38 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 6 + - 2959.27 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 3 + - 3439.95 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 4036.06 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 3181.9 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 3 + - 3934.24 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 176.292 + - - - 64 + - 128 + - 1 + - 
768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 99.6577 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 6 + - 2933.5 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 0 + - 3460.7 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 1 + - 2362.88 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 5 + - 1911.27 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 2309.77 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3903.22 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 4 + - 3096.87 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 3 + - 4219.73 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 4 + - 3949.36 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 3 + - 4109.02 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 5 + - 1217.42 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 2 + - 1549.53 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 0 + - 3598.13 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 0 + - 3937.09 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 3 + - 3930.61 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 1100.29 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 6 + - 3043.2 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 163.696 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 2 + - 753.11 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 1 + - 965.94 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 3 + - 3980.24 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 
2 + - 764.826 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 3 + - 3975.0 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 4363.13 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 2 + - 1020.46 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 3 + - 4126.19 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 2380.28 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 0 + - 3938.53 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 1584.13 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 592.656 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 2 + - 781.963 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 128.374 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 2901.92 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 4134.91 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3872.77 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3197.89 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 3556.2 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 4 + - 3281.84 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 3930.75 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 7 + - 12.2279 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4336.2 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 6 + - 3474.12 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 2483.9 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 3819.24 + - - - 2944 + - 
3584 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 3 + - 4022.48 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 108.675 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 342.75 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4161.07 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 0 + - 3572.4 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 6 + - 3278.06 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 21.307 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 2 + - 1532.18 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 3 + - 3314.65 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 2 + - 1868.42 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 0 + - 4019.86 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 0 + - 3758.65 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 6 + - 3130.46 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 1 + - 1112.35 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 81.9581 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 3796.02 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 3 + - 4291.75 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 5 + - 3058.7 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3492.85 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 0 + - 3764.21 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 2 + - 392.81 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 5 + - 2778.18 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 768 + 
- 768 + - - 0 + - 3783.16 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 4 + - 2995.2 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 0 + - 3806.19 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 6 + - 2205.16 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 3 + - 3991.52 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 3 + - 4131.3 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 2 + - 1498.85 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 1943.97 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 1 + - 2351.63 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 4044.93 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 3228.83 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 6 + - 3272.83 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 2539.14 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 1252.53 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 4 + - 3504.5 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 2 + - 1451.8 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 0 + - 3374.04 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 7 + - 45.5761 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 1111.09 +- null diff --git a/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml b/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml new file mode 100644 index 000000000..06be19da4 --- /dev/null +++ b/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml @@ -0,0 +1,11947 @@ +- 
MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + 
GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + 
IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x32x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + 
GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 128 + LSPA: 16 + LSPB: 8 + LVCA: 16 + LVCB: 32 + LVPA: 4 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + 
NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + 
GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 128 + LSPA: 8 + LSPB: 8 + LVCA: 32 + LVCB: 32 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + 
IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + 
GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + 
IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + 
GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 64 + LSPA: 8 + LSPB: 16 + LVCA: 32 + LVCB: 16 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 2048 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: 
+ - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + 
GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 8 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + 
Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x64x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: 
true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 
0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + 
GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: 
false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 704 + - - 0 + - 2919.39 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1408 + - - 3 + - 3965.21 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 256 + - - 5 + - 3399.4 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1856 + - - 3 + - 3677.9 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 704 + - - 2 + - 4025.67 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1856 + - - 1 + - 4099.34 + - - - 704 + - 128 + - 1 + - 256 + 
- 704 + - 704 + - 704 + - 128 + - - 5 + - 687.223 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 448 + - - 0 + - 3882.38 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1024 + - - 2 + - 2991.29 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 128 + - - 3 + - 3361.73 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 256 + - - 3 + - 3403.36 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 3584 + - - 4 + - 4166.96 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1856 + - - 5 + - 882.062 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 128 + - - 5 + - 2048.56 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 6784 + - - 1 + - 4227.19 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 64 + - - 0 + - 2273.46 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 4 + - 6784 + - - 6 + - 194.253 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 5888 + - - 0 + - 3475.26 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 5056 + - - 4 + - 4213.88 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 448 + - - 0 + - 4202.37 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1856 + - - 2 + - 4153.36 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 2368 + - - 0 + - 3619.5 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 6784 + - - 3 + - 3128.03 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 4 + - - 6 + - 149.186 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 128 + - - 0 + - 2511.61 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1408 + - - 6 + - 39.7262 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1856 + - - 5 + - 4017.34 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 4288 + - - 4 + - 4130.97 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 64 + - 5888 + - - 0 + 
- 1980.08 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 64 + - 64 + - - 5 + - 41.1402 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2944 + - - 3 + - 2489.92 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 3287.9 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 6784 + - - 1 + - 4140.0 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1024 + - - 5 + - 3273.89 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3470.26 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 448 + - - 5 + - 3790.78 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3584 + - - 6 + - 128.44 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 1024 + - - 2 + - 3437.89 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1856 + - - 3 + - 4009.11 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 669.456 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 2944 + - - 2 + - 4215.74 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 2944 + - - 3 + - 3651.59 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 4 + - - 6 + - 161.666 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 6784 + - - 4 + - 4422.41 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 4 + - 1024 + - - 6 + - 38.4202 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1856 + - - 3 + - 3710.2 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 5888 + - - 6 + - 196.019 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 704 + - 64 + - - 5 + - 471.175 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 3584 + - - 4 + - 4043.78 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1024 + - - 5 + - 3721.51 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 5056 + - - 1 + - 4197.94 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 
+ - 4288 + - 4288 + - 1408 + - - 3 + - 3770.16 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 128 + - - 5 + - 1559.53 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 4 + - - 6 + - 5.6044 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 4 + - 704 + - - 6 + - 21.193 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 64 + - - 5 + - 940.711 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 704 + - 6784 + - - 3 + - 3800.68 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 704 + - - 0 + - 525.528 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 4 + - - 6 + - 160.47 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 4 + - 2944 + - - 6 + - 83.1375 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 3 + - 2502.66 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3773.07 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 6784 + - - 1 + - 4366.11 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 704 + - 4 + - - 6 + - 20.9987 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 4288 + - - 4 + - 4129.09 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 64 + - - 0 + - 333.558 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 64 + - - 5 + - 789.73 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 2944 + - - 1 + - 4258.3 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 128 + - - 3 + - 3066.76 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 704 + - 704 + - - 5 + - 2265.32 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1408 + - - 5 + - 4027.4 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 4288 + - - 0 + - 4095.44 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 2368 + - - 3 + - 4148.74 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 5056 + - - 4 + - 4267.51 + - - - 1024 + - 5888 + 
- 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 5888 + - - 3 + - 3943.23 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 704 + - 704 + - - 5 + - 1764.42 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 256 + - 448 + - - 5 + - 1189.51 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 2368 + - - 5 + - 3576.62 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5056 + - - 3 + - 3022.54 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 2368 + - - 6 + - 86.8332 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1408 + - - 3 + - 4153.8 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3584 + - - 4 + - 4219.31 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 3584 + - - 5 + - 3646.0 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 2368 + - - 3 + - 4137.56 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1024 + - - 4 + - 3614.3 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 2368 + - - 3 + - 3987.25 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1856 + - - 5 + - 2304.16 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 64 + - - 0 + - 3547.32 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 4288 + - - 5 + - 2766.27 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 448 + - - 5 + - 334.09 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4 + - - 6 + - 8.75529 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 256 + - - 5 + - 2169.37 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 128 + - 448 + - - 0 + - 443.741 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 448 + - 2944 + - - 3 + - 3463.05 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 448 + - - 5 + - 4088.07 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 2944 + - - 1 + - 3992.62 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 704 + - 6784 + 
- - 3 + - 3982.47 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 64 + - 2944 + - - 5 + - 1284.11 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 5056 + - - 5 + - 2771.32 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1024 + - - 2 + - 3487.93 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3806.84 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 1925.42 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 2944 + - - 3 + - 3911.12 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 448 + - - 3 + - 3083.38 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 704 + - - 3 + - 3828.1 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 704 + - - 0 + - 3364.48 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 2368 + - - 3 + - 3930.02 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 448 + - - 0 + - 3522.83 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 448 + - 448 + - - 5 + - 1344.94 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 4288 + - - 1 + - 4182.27 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 5888 + - - 1 + - 4196.28 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 2944 + - - 0 + - 3188.23 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 448 + - - 3 + - 2522.12 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 8.91734 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 5056 + - - 4 + - 4422.36 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 1856 + - - 3 + - 3887.18 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 6784 + - - 0 + - 3903.22 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1408 + - - 3 + - 3687.66 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 5056 + - - 4 + - 4181.82 + - 
- - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 64 + - - 0 + - 2370.45 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 128 + - 2368 + - - 5 + - 1645.26 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 5888 + - - 2 + - 4314.85 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1856 + - - 0 + - 2409.83 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 64 + - - 5 + - 1433.88 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 128 + - 64 + - - 5 + - 63.5965 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 128 + - - 0 + - 191.553 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 4 + - - 6 + - 193.292 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 4 + - - 6 + - 11.4122 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 4288 + - - 3 + - 4153.91 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 128 + - - 6 + - 5.74574 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 6784 + - - 1 + - 4401.5 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 256 + - 2368 + - - 0 + - 2606.89 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 704 + - - 5 + - 3956.89 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 6784 + - - 1 + - 4362.62 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 448 + - - 3 + - 2147.97 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1024 + - - 3 + - 3002.64 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1856 + - - 3 + - 4045.93 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1024 + - - 2 + - 3822.18 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 6784 + - - 5 + - 4049.53 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1408 + - - 3 + - 4054.63 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 704 + - 4288 + - - 3 + - 3367.98 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 
2368 + - 2368 + - 64 + - - 5 + - 1737.41 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 2944 + - - 0 + - 3102.42 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1856 + - - 3 + - 3245.54 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1856 + - - 6 + - 51.8408 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 0 + - 257.341 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 256 + - - 5 + - 199.222 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 4 + - - 6 + - 51.9996 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 704 + - 2368 + - - 3 + - 3029.67 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 5888 + - - 1 + - 4363.5 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 704 + - - 2 + - 3966.3 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3242.83 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 704 + - - 5 + - 2153.58 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 5888 + - - 2 + - 4119.9 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 2944 + - - 3 + - 3977.27 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 64 + - 704 + - - 5 + - 347.421 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 5056 + - - 5 + - 2791.61 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 4 + - - 6 + - 0.181457 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1024 + - - 6 + - 37.9774 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 3584 + - - 2 + - 4350.48 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 4 + - - 6 + - 137.692 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1024 + - - 0 + - 1341.28 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 3584 + - - 1 + - 4245.11 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 128 + - - 5 + - 1799.74 + - - - 128 + - 5888 + - 1 + - 768 + - 
128 + - 128 + - 128 + - 5888 + - - 3 + - 2935.41 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 64 + - 448 + - - 0 + - 223.673 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 64 + - - 5 + - 680.013 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 4 + - - 6 + - 168.606 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 6784 + - - 0 + - 3658.8 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 6784 + - - 4 + - 4213.36 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 704 + - 4 + - - 6 + - 27.6418 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 4288 + - - 4 + - 4214.89 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 64 + - - 5 + - 490.142 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 4 + - - 6 + - 99.326 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 64 + - - 5 + - 1537.3 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 128 + - - 5 + - 2278.34 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 704 + - 448 + - - 5 + - 1704.64 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 128 + - - 5 + - 95.7 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 2944 + - - 1 + - 3968.33 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 4288 + - - 5 + - 2277.51 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2368 + - - 3 + - 2056.4 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 5888 + - - 3 + - 4018.88 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 5 + - 859.223 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 256 + - 4 + - - 6 + - 10.6206 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 64 + - - 0 + - 3712.23 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 2368 + - - 3 + - 4076.08 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 5056 + - - 1 + - 4312.58 + - - - 1408 + - 3584 + - 
1 + - 256 + - 1408 + - 1408 + - 1408 + - 3584 + - - 4 + - 3394.7 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 5888 + - - 4 + - 4311.26 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 5888 + - - 3 + - 4107.54 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1024 + - - 6 + - 28.4982 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 5056 + - - 4 + - 4136.75 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 2944 + - - 0 + - 3243.99 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 448 + - - 0 + - 2389.52 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 64 + - 4288 + - - 5 + - 2038.08 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 5 + - 1920.05 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 256 + - 2944 + - - 3 + - 2934.06 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 2368 + - - 5 + - 4108.74 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1024 + - - 5 + - 791.749 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 448 + - - 3 + - 3360.26 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 2368 + - - 6 + - 84.147 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 128 + - 5056 + - - 3 + - 2191.32 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 704 + - 3584 + - - 0 + - 3426.21 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 2680.25 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1408 + - - 3 + - 3673.83 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 4 + - - 6 + - 166.453 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1408 + - - 3 + - 2373.74 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1856 + - - 2 + - 3912.6 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 256 + - 128 + - - 5 + - 343.771 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1408 + - - 
5 + - 3792.27 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 448 + - - 6 + - 19.7668 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 6784 + - - 0 + - 3783.6 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 2944 + - - 5 + - 2129.29 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 5056 + - - 3 + - 4049.81 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 198.595 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 448 + - 6784 + - - 3 + - 3388.94 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 1024 + - - 4 + - 3246.95 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 704 + - - 5 + - 3735.54 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1856 + - - 3 + - 3963.13 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 5888 + - - 4 + - 4253.42 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 704 + - - 3 + - 3642.9 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1856 + - - 3 + - 3856.09 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1408 + - - 3 + - 3868.6 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1408 + - - 5 + - 939.01 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 256 + - - 5 + - 1945.21 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 704 + - 3584 + - - 1 + - 3165.88 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3584 + - - 0 + - 3983.17 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 4288 + - - 0 + - 3524.27 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 2944 + - - 1 + - 4222.0 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 704 + - - 5 + - 546.677 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 2368 + - - 0 + - 2868.13 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 64 + - - 5 + - 2751.86 + - - - 6784 + - 2368 + - 1 + - 768 + 
- 6784 + - 6784 + - 6784 + - 2368 + - - 1 + - 4161.93 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 6784 + - - 1 + - 4400.04 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 704 + - 2944 + - - 0 + - 3535.95 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1024 + - - 2 + - 4106.69 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 4 + - - 6 + - 82.772 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1408 + - - 0 + - 2654.29 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 448 + - - 3 + - 3379.49 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 448 + - 2368 + - - 3 + - 2521.25 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 2944 + - - 1 + - 4177.8 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 5056 + - - 6 + - 167.599 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 5888 + - - 1 + - 4228.5 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 4288 + - - 1 + - 4214.57 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1408 + - - 5 + - 2539.01 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1024 + - - 5 + - 3901.52 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 128 + - 6784 + - - 3 + - 3354.88 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 11.4137 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 448 + - - 3 + - 2765.1 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3584 + - - 0 + - 3690.82 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1408 + - - 1 + - 4184.21 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1408 + - - 0 + - 3108.57 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 6784 + - - 1 + - 3976.58 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 64 + - - 5 + - 1488.62 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 2944 + - - 1 
+ - 4125.34 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1024 + - - 3 + - 2724.02 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 5056 + - - 1 + - 4242.95 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 704 + - - 5 + - 4001.2 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 4 + - 4288 + - - 6 + - 118.631 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 704 + - - 5 + - 3209.86 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 2944 + - - 1 + - 4245.93 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 1408 + - - 3 + - 3968.21 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 128 + - - 0 + - 1640.81 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 4288 + - - 3 + - 3969.99 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 5888 + - - 3 + - 4128.28 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1856 + - - 3 + - 3365.97 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 64 + - 64 + - - 5 + - 28.656 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 6784 + - - 1 + - 4301.03 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 764.961 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 1408 + - - 3 + - 3358.94 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 4288 + - - 4 + - 4356.44 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 128 + - 3584 + - - 0 + - 2296.4 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 64 + - 5888 + - - 0 + - 2748.52 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 256 + - 5056 + - - 3 + - 3403.11 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 2944 + - - 3 + - 3271.25 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 128 + - - 5 + - 3106.07 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 2368 + - - 1 + - 4199.88 + - - - 1856 
+ - 704 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 704 + - - 3 + - 3064.95 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 448 + - 6784 + - - 5 + - 3669.47 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 704 + - - 5 + - 1091.74 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 3 + - 3108.32 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3584 + - - 4 + - 4114.57 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 448 + - 704 + - - 5 + - 1710.41 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1856 + - - 1 + - 4048.53 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 4288 + - - 2 + - 4375.13 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1856 + - - 3 + - 3056.89 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 3584 + - - 1 + - 4078.37 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3584 + - - 2 + - 4385.26 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 5888 + - - 1 + - 4266.21 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1408 + - - 3 + - 2981.34 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 256 + - - 3 + - 2384.76 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 448 + - - 0 + - 3719.08 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 704 + - - 3 + - 2370.78 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 5056 + - - 2 + - 4030.12 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3144.93 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 2368 + - - 3 + - 4014.13 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 3182.26 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 2944 + - - 6 + - 102.866 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 2944 + - - 3 + - 3928.88 + - - - 2944 + - 5888 + - 1 
+ - 3328 + - 2944 + - 2944 + - 2944 + - 5888 + - - 4 + - 4298.98 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 128 + - 5056 + - - 5 + - 2552.59 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 6784 + - - 0 + - 3555.36 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3584 + - - 1 + - 4062.15 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 442.314 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 5888 + - - 3 + - 4167.2 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 2368 + - - 3 + - 4072.45 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 128 + - 448 + - - 5 + - 601.425 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3584 + - - 0 + - 3903.22 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3584 + - - 4 + - 4363.34 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 5056 + - - 3 + - 3876.46 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 4288 + - - 3 + - 4142.95 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 448 + - - 5 + - 3515.64 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1024 + - - 0 + - 1410.17 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1856 + - - 5 + - 4201.36 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 704 + - 2944 + - - 3 + - 3102.86 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 448 + - - 0 + - 3897.55 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 448 + - - 3 + - 2916.8 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 2368 + - - 0 + - 3313.33 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 2368 + - - 0 + - 4127.77 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 5056 + - - 5 + - 2677.48 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3584 + - - 4 + - 4106.38 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 
+ - 1408 + - 1408 + - 3584 + - - 5 + - 3759.1 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1408 + - - 3 + - 3889.9 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2766.18 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 1024 + - - 4 + - 3392.31 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 704 + - - 5 + - 3652.11 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1856 + - - 2 + - 4114.36 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 5888 + - - 0 + - 3931.65 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 3584 + - - 4 + - 4088.58 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 6784 + - - 1 + - 4264.6 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 64 + - - 5 + - 2393.97 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 128 + - - 6 + - 5.77385 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2702.46 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 64 + - - 5 + - 3232.71 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 4288 + - - 3 + - 4016.92 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 1795.26 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1408 + - - 3 + - 3651.26 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 256 + - - 5 + - 397.985 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 256 + - - 3 + - 2923.86 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 1856 + - - 3 + - 4140.71 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 5056 + - - 4 + - 4087.73 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 2944 + - - 1 + - 4108.79 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 2944 + - - 1 + - 4161.96 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 704 
+ - 704 + - - 0 + - 2531.6 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 704 + - 5888 + - - 3 + - 3650.25 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 128 + - - 5 + - 1248.85 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 10.7814 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 64 + - - 5 + - 1091.32 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 448 + - - 0 + - 2731.77 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1408 + - - 5 + - 2705.09 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 704 + - - 5 + - 3644.53 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 448 + - - 3 + - 3441.81 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 3584 + - - 4 + - 4355.7 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 4288 + - - 5 + - 2678.95 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1856 + - - 3 + - 3687.53 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 4288 + - - 3 + - 3997.74 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 448 + - 4 + - - 6 + - 18.2225 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 256 + - 704 + - - 5 + - 1796.63 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1856 + - - 3 + - 3852.39 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1856 + - - 2 + - 3722.71 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 128 + - 128 + - - 5 + - 122.06 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 2368 + - - 3 + - 3684.15 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 2368 + - - 3 + - 3991.39 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 64 + - 704 + - - 0 + - 471.278 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3445.52 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 64 + - 2368 + - - 5 + - 1080.91 + - - - 2944 + - 64 + - 1 
+ - 256 + - 2944 + - 2944 + - 2944 + - 64 + - - 5 + - 1284.84 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 256 + - 4288 + - - 0 + - 3173.46 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 4 + - - 6 + - 37.2204 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 256 + - 6784 + - - 0 + - 3457.62 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 4 + - 128 + - - 6 + - 5.43 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 2368 + - - 5 + - 2514.34 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 2944 + - - 1 + - 4276.42 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 128 + - 3584 + - - 0 + - 3274.21 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1024 + - - 0 + - 760.575 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 448 + - - 0 + - 3564.22 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 64 + - - 5 + - 546.018 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 128 + - - 5 + - 3248.47 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 4 + - 5056 + - - 6 + - 154.793 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1408 + - - 3 + - 3298.29 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 3584 + - - 3 + - 2785.95 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1024 + - - 3 + - 3645.14 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 64 + - - 0 + - 95.9735 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 2944 + - - 1 + - 4141.45 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 5056 + - - 3 + - 3888.62 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 128 + - - 5 + - 1337.19 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 2368 + - - 3 + - 3801.51 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 6784 + - - 1 + - 4377.32 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 4 + - - 6 + - 
127.696 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 4 + - - 6 + - 142.208 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 3584 + - - 4 + - 4241.77 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 6784 + - - 6 + - 219.994 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 256 + - - 5 + - 2978.48 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 2368 + - - 3 + - 4103.33 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 448 + - - 0 + - 3374.02 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 448 + - 64 + - - 5 + - 216.495 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 704 + - 1408 + - - 0 + - 2915.64 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 4 + - 3584 + - - 6 + - 100.063 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 64 + - - 5 + - 1089.32 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 3584 + - - 2 + - 4118.68 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 448 + - 3584 + - - 3 + - 2729.9 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 448 + - - 0 + - 3101.32 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 64 + - - 5 + - 2207.16 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 256 + - - 5 + - 382.64 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 6784 + - - 0 + - 4087.13 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3975.75 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 3 + - 2598.69 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 64 + - - 6 + - 2.85864 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 3584 + - - 1 + - 4014.94 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 2368 + - - 1 + - 3977.02 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 6784 + - - 3 + - 3942.58 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 
448 + - 448 + - 256 + - - 5 + - 1189.59 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 4 + - - 6 + - 2.78307 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 704 + - 128 + - - 5 + - 941.598 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 2944 + - - 1 + - 3872.53 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1856 + - - 0 + - 3874.81 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1024 + - - 4 + - 3603.09 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 448 + - 5888 + - - 3 + - 3386.81 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 704 + - - 5 + - 2726.63 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 3584 + - - 1 + - 4275.11 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 448 + - - 3 + - 3259.95 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1024 + - - 2 + - 3951.87 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 4288 + - - 4 + - 4366.67 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1856 + - - 5 + - 1434.07 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 704 + - - 5 + - 3703.12 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 6784 + - - 1 + - 4221.55 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 2944 + - - 3 + - 3693.09 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1024 + - - 3 + - 3436.38 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1856 + - - 4 + - 4077.22 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 256 + - 5888 + - - 0 + - 3239.3 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1024 + - - 0 + - 2263.62 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 64 + - 3584 + - - 0 + - 2182.38 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 5 + - 1413.49 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 128 + - - 3 + - 
2853.3 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 64 + - - 5 + - 683.208 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 128 + - 4 + - - 6 + - 4.35437 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 2368 + - - 5 + - 1733.62 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1856 + - - 5 + - 2819.97 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 4288 + - - 3 + - 3793.18 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 5056 + - - 2 + - 3965.06 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 256 + - - 5 + - 1331.51 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 64 + - - 0 + - 2676.56 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 2944 + - - 0 + - 3290.5 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 3584 + - - 5 + - 3684.08 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 448 + - - 5 + - 3666.83 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 2944 + - - 5 + - 2247.73 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 5056 + - - 3 + - 4085.38 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 4 + - 2944 + - - 6 + - 97.1723 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 170.47 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 5056 + - - 3 + - 3750.12 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 2944 + - - 0 + - 3852.27 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 1024 + - - 4 + - 3334.32 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 1408 + - - 3 + - 3909.9 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 448 + - 448 + - - 5 + - 1975.49 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 6784 + - - 1 + - 4175.26 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3584 + - - 1 + - 4286.17 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + 
- 2368 + - 2368 + - 128 + - - 5 + - 2618.29 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 704 + - 5056 + - - 3 + - 3504.31 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1024 + - - 3 + - 3489.25 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 2944 + - - 1 + - 4288.48 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 4 + - 5888 + - - 6 + - 149.024 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 128 + - 2944 + - - 5 + - 2762.93 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 5888 + - - 2 + - 4388.07 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 2944 + - - 1 + - 4258.33 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1856 + - - 5 + - 4067.08 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 448 + - 704 + - - 5 + - 2343.84 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1024 + - - 3 + - 2882.96 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 4 + - 4 + - - 6 + - 0.167285 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 128 + - - 0 + - 252.345 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 4288 + - - 2 + - 4329.74 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 3 + - 2043.4 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 3584 + - - 4 + - 4209.22 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1408 + - - 6 + - 52.9228 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 64 + - - 5 + - 759.656 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1408 + - - 3 + - 3952.8 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 5888 + - - 0 + - 3095.14 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 5888 + - - 3 + - 3892.37 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1408 + - - 0 + - 1918.56 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 3584 + - - 4 + - 4011.18 + - - 
- 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1408 + - - 3 + - 3842.39 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 4288 + - - 0 + - 3819.09 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 5056 + - - 3 + - 4012.01 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 64 + - 4 + - - 6 + - 2.18921 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1024 + - - 4 + - 3673.03 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 64 + - - 5 + - 2706.1 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 5056 + - - 3 + - 4009.41 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 1024 + - - 3 + - 3090.74 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 3584 + - - 4 + - 4087.91 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 256 + - - 5 + - 3866.84 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 64 + - - 5 + - 1860.78 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 4288 + - - 4 + - 4328.08 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 5056 + - - 4 + - 4099.19 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 5888 + - - 1 + - 4197.38 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 6784 + - - 1 + - 4198.1 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1024 + - - 3 + - 2847.6 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 5888 + - - 3 + - 4142.4 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 6784 + - - 0 + - 3996.33 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 4288 + - - 3 + - 3914.84 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 6784 + - - 1 + - 4250.91 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 4 + - - 6 + - 132.309 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 64 + - - 0 + - 2035.98 + - - - 4 + - 
704 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 704 + - - 6 + - 26.4869 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1024 + - - 4 + - 3550.13 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 3584 + - - 4 + - 4319.25 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 2368 + - - 3 + - 3776.85 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3707.19 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1408 + - - 0 + - 1235.65 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1024 + - - 4 + - 3547.96 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 2368 + - - 3 + - 3869.81 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 64 + - - 5 + - 3151.13 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 64 + - - 0 + - 525.454 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 704 + - - 0 + - 2456.3 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 4 + - - 6 + - 26.3506 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 4 + - - 6 + - 216.495 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 4 + - - 6 + - 100.881 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 1408 + - - 3 + - 4014.39 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 128 + - - 3 + - 3611.13 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 64 + - - 0 + - 99.7293 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 128 + - - 5 + - 3718.19 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 4288 + - - 4 + - 4293.61 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 3584 + - - 4 + - 4198.46 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1408 + - - 5 + - 3209.46 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3250.19 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 
+ - 3584 + - 3584 + - - 1 + - 4044.21 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 4288 + - - 3 + - 4003.9 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 64 + - - 5 + - 1374.65 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 2368 + - - 1 + - 4211.22 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3837.98 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1408 + - - 1 + - 4180.09 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1856 + - - 5 + - 3818.01 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 704 + - 1856 + - - 3 + - 3440.88 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 3584 + - - 1 + - 4038.56 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 64 + - - 5 + - 1747.73 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 256 + - - 5 + - 2646.85 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 448 + - - 6 + - 18.4378 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 2944 + - - 3 + - 4010.93 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 5056 + - - 3 + - 4017.88 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 5056 + - - 1 + - 4207.49 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 128 + - 256 + - - 5 + - 343.822 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 2368 + - - 0 + - 3429.79 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 504.772 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 448 + - 2944 + - - 3 + - 3069.33 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 64 + - - 5 + - 46.7448 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 5056 + - - 3 + - 4102.31 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 128 + - 704 + - - 5 + - 686.57 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 5056 + - - 4 + - 
4381.53 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 448 + - 64 + - - 5 + - 298.301 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2826.64 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 2944 + - - 3 + - 3838.04 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 2944 + - - 1 + - 4248.99 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 128 + - - 5 + - 1092.63 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 704 + - - 5 + - 3577.71 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1024 + - - 4 + - 3625.92 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1856 + - - 0 + - 4106.48 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 448 + - - 5 + - 696.217 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 448 + - - 5 + - 2815.38 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 2944 + - - 3 + - 3965.97 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3665.63 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 448 + - - 0 + - 2288.28 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 704 + - - 5 + - 2616.79 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3584 + - - 4 + - 4248.43 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 448 + - - 0 + - 1330.23 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 704 + - - 3 + - 3444.16 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 704 + - 2368 + - - 5 + - 3339.21 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 4 + - - 6 + - 104.423 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1024 + - - 0 + - 2173.33 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 4288 + - - 4 + - 4272.88 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 5888 + - - 3 + - 4047.97 + - - - 4 
+ - 704 + - 1 + - 768 + - 4 + - 4 + - 4 + - 704 + - - 6 + - 27.9776 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 6784 + - - 0 + - 3814.9 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 5056 + - - 1 + - 4052.15 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 5888 + - - 4 + - 4400.94 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 5888 + - - 6 + - 189.146 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 5888 + - - 1 + - 4338.08 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 4288 + - - 1 + - 4320.35 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 1856 + - - 3 + - 3415.85 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 3584 + - - 1 + - 4211.56 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 448 + - - 3 + - 3470.26 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 4288 + - - 3 + - 4113.36 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 5056 + - - 3 + - 4122.79 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1408 + - - 5 + - 3624.38 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 256 + - - 0 + - 191.101 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 128 + - 704 + - - 5 + - 940.712 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 448 + - - 0 + - 3860.84 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 64 + - 6784 + - - 0 + - 3144.95 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 448 + - - 5 + - 3850.58 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 448 + - - 0 + - 3858.56 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 704 + - - 5 + - 3711.98 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1856 + - - 4 + - 4106.89 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 704 + - - 5 + - 4074.94 + - - - 128 + - 2368 + - 1 + - 3328 + 
- 128 + - 128 + - 128 + - 2368 + - - 5 + - 2621.52 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2483.94 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 704 + - 5056 + - - 2 + - 3789.96 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 4 + - - 6 + - 36.9678 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 704 + - - 5 + - 1049.2 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 6784 + - - 6 + - 212.208 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 448 + - 5888 + - - 3 + - 3613.02 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 6784 + - - 0 + - 3717.66 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1408 + - - 5 + - 679.986 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1024 + - - 3 + - 3486.08 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 4288 + - - 4 + - 4312.4 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 704 + - 1024 + - - 3 + - 2795.61 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3559.29 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 5056 + - - 0 + - 3782.95 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 704 + - - 2 + - 3794.09 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 64 + - 448 + - - 5 + - 299.1 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1408 + - - 1 + - 3981.44 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 4288 + - - 0 + - 3447.47 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 2368 + - - 1 + - 4091.67 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1856 + - - 5 + - 3862.57 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1408 + - - 5 + - 2787.45 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 704 + - - 0 + - 3037.72 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 128 + - 128 + - - 5 + - 172.036 
+ - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 2944 + - - 3 + - 3805.83 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 4 + - - 6 + - 39.1339 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1856 + - - 6 + - 69.724 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 64 + - - 5 + - 2133.52 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 4 + - - 6 + - 66.0936 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 2368 + - - 3 + - 3855.84 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 704 + - - 3 + - 3804.97 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 448 + - 1856 + - - 3 + - 2752.33 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 2944 + - - 1 + - 4202.29 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 3584 + - - 2 + - 3543.21 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3584 + - - 0 + - 3528.38 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 3584 + - - 0 + - 3435.87 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 2368 + - - 3 + - 3965.76 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1024 + - - 5 + - 1575.26 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1024 + - - 0 + - 496.33 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 4288 + - - 5 + - 2371.5 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 704 + - - 3 + - 3035.65 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 4 + - 2368 + - - 6 + - 66.8813 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 5888 + - - 0 + - 3289.92 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 2944 + - - 2 + - 4250.44 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 5056 + - - 1 + - 4256.68 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 5888 + - - 5 + - 3876.51 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 
4288 + - 4288 + - 3584 + - - 2 + - 4251.54 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 4 + - - 6 + - 67.2311 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 2368 + - - 5 + - 1820.1 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1856 + - - 3 + - 3828.99 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 4 + - - 6 + - 118.07 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 4 + - 128 + - - 6 + - 4.4929 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 128 + - - 5 + - 2665.48 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 4288 + - - 4 + - 4324.92 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 4 + - - 6 + - 126.945 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 5056 + - - 1 + - 4245.26 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 4 + - - 6 + - 26.6986 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 6784 + - - 3 + - 3678.82 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 64 + - 3584 + - - 0 + - 1484.44 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 2368 + - - 3 + - 4141.21 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1024 + - - 3 + - 3301.25 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 128 + - - 3 + - 3543.23 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 5 + - 2388.63 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 256 + - - 5 + - 1387.47 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 4 + - - 6 + - 53.9165 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 2935.16 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 4288 + - - 3 + - 3851.88 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 4 + - 1856 + - - 6 + - 67.8511 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 64 + - - 5 + - 2243.33 + - - - 64 + - 
256 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 0 + - 126.926 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 704 + - - 3 + - 3364.54 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1024 + - - 3 + - 2373.69 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 5056 + - - 4 + - 4413.13 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 64 + - 128 + - - 0 + - 85.7244 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 5888 + - - 1 + - 4286.35 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 4288 + - - 6 + - 142.313 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 2368 + - - 5 + - 4100.03 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 4288 + - - 6 + - 147.689 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1856 + - - 5 + - 1372.62 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 2368 + - - 5 + - 2700.41 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 64 + - 5056 + - - 5 + - 1749.11 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 448 + - 4 + - - 6 + - 14.6511 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 128 + - 4 + - - 6 + - 5.31222 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 4 + - 5056 + - - 6 + - 132.49 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 128 + - - 0 + - 99.6225 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1856 + - - 6 + - 67.8806 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 5056 + - - 0 + - 3677.35 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 5056 + - - 4 + - 4067.5 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 2944 + - - 1 + - 4114.77 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1024 + - - 3 + - 2363.6 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 4 + - 4 + - - 6 + - 0.132643 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 4 + - 2368 + - - 6 + - 80.2433 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 
704 + - 704 + - 1408 + - - 5 + - 3129.04 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 2368 + - - 1 + - 4027.48 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 5056 + - - 3 + - 3935.93 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 5056 + - - 1 + - 4326.23 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 2368 + - - 3 + - 4103.96 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 5888 + - - 4 + - 4318.6 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 2368 + - - 1 + - 4104.1 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 1024 + - - 4 + - 3324.52 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 5056 + - - 4 + - 4222.28 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 448 + - - 5 + - 1387.06 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 6784 + - - 0 + - 3724.13 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 4 + - - 6 + - 210.45 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 6784 + - - 1 + - 4097.23 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 128 + - - 5 + - 2764.34 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1856 + - - 3 + - 3881.01 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 122.06 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 5888 + - - 5 + - 3782.58 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 4042.23 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 5888 + - - 1 + - 4317.1 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 4 + - 64 + - - 6 + - 2.70127 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 128 + - 4288 + - - 5 + - 1921.77 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1408 + - - 3 + - 3836.14 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 6784 + - - 
1 + - 4388.59 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 5888 + - - 0 + - 3963.54 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 5888 + - - 0 + - 3239.97 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 64 + - - 0 + - 2790.18 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 5888 + - - 3 + - 3700.3 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1024 + - - 2 + - 3401.63 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1024 + - - 0 + - 1944.01 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1856 + - - 0 + - 1225.2 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 4288 + - - 3 + - 4055.91 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 6784 + - - 1 + - 4409.39 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1408 + - - 3 + - 4118.01 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 4288 + - - 3 + - 4113.12 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 448 + - - 5 + - 2725.95 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1024 + - - 4 + - 3581.47 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1856 + - - 4 + - 4265.51 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 4 + - 64 + - - 6 + - 2.20612 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1408 + - - 0 + - 2152.47 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 5888 + - - 3 + - 3949.97 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 4288 + - - 3 + - 3776.65 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3584 + - - 0 + - 2703.7 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 2368 + - - 3 + - 3976.11 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 5056 + - - 2 + - 4200.55 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1408 + - - 3 + - 4043.67 + - - - 6784 
+ - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 5888 + - - 4 + - 4261.96 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 5888 + - - 3 + - 4092.65 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 704 + - - 5 + - 3815.54 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 448 + - - 0 + - 3430.22 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 256 + - - 5 + - 3108.26 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 128 + - 2944 + - - 0 + - 1985.29 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 5056 + - - 5 + - 2858.07 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 4 + - - 6 + - 112.177 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 1238.66 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 2944 + - - 6 + - 106.164 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1024 + - - 2 + - 3925.16 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 2944 + - - 0 + - 3738.38 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 704 + - - 5 + - 3710.59 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 448 + - 4288 + - - 5 + - 3800.78 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 448 + - - 0 + - 3789.71 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 704 + - - 0 + - 3561.84 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 2944 + - - 5 + - 3909.2 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 4 + - - 6 + - 182.654 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 64 + - 4 + - - 6 + - 2.62659 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 6784 + - - 1 + - 4399.29 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 128 + - - 0 + - 382.627 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 128 + - - 5 + - 2158.21 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 
2944 + - 2944 + - 2944 + - - 4 + - 4193.73 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 6784 + - - 1 + - 4273.81 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 704 + - - 5 + - 1238.83 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1408 + - - 3 + - 3906.13 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 5888 + - - 1 + - 4349.57 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 5888 + - - 0 + - 3569.22 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1856 + - - 4 + - 4095.42 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 128 + - - 5 + - 948.368 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1408 + - - 5 + - 4093.9 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 448 + - - 5 + - 2518.46 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4288 + - - 3 + - 2591.66 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 4 + - - 6 + - 18.2679 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1856 + - - 0 + - 3509.68 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 448 + - 5056 + - - 3 + - 3644.56 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1856 + - - 3 + - 3310.94 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1408 + - - 6 + - 51.6418 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 64 + - - 5 + - 49.4489 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1856 + - - 5 + - 2664.59 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 6784 + - - 1 + - 4351.47 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 128 + - 6784 + - - 3 + - 2817.05 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 64 + - 5056 + - - 5 + - 2395.32 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1408 + - - 0 + - 3688.14 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 4 + - - 6 + - 94.74 + - - 
- 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 4 + - 6784 + - - 6 + - 166.161 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 128 + - 64 + - - 5 + - 86.5101 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 448 + - - 0 + - 3628.55 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 704 + - - 0 + - 3535.45 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1408 + - - 1 + - 4141.53 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 704 + - - 5 + - 3661.36 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1024 + - - 4 + - 3607.26 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 5888 + - - 4 + - 4288.02 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 4288 + - - 1 + - 4204.24 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 2368 + - - 5 + - 4152.44 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 2944 + - - 0 + - 3627.43 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 4 + - - 6 + - 188.591 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 4 + - 4288 + - - 6 + - 132.797 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 3584 + - - 2 + - 3968.31 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 2944 + - - 0 + - 3632.22 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 4288 + - - 4 + - 4282.99 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 4 + - - 6 + - 0.183805 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1408 + - - 0 + - 2043.93 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1408 + - - 3 + - 3908.87 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1024 + - - 5 + - 2971.61 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2793.03 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 3584 + - - 0 + - 3726.19 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + 
- 4 + - 1408 + - - 6 + - 54.6578 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 704 + - - 5 + - 3816.87 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 704 + - 448 + - - 5 + - 2344.93 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 448 + - - 0 + - 3674.29 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 128 + - - 5 + - 1569.46 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 256 + - 3584 + - - 0 + - 3484.11 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 64 + - - 5 + - 347.676 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1856 + - - 4 + - 4220.72 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1024 + - - 6 + - 37.5087 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 2944 + - - 1 + - 4297.39 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1856 + - - 1 + - 3871.56 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 4 + - 3584 + - - 6 + - 114.403 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1024 + - - 4 + - 3313.85 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 601.949 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 704 + - - 0 + - 3130.33 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 5056 + - - 6 + - 173.395 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 128 + - - 5 + - 1984.85 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 5056 + - - 4 + - 4116.81 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 5888 + - - 3 + - 4135.04 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1024 + - - 4 + - 3696.76 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1856 + - - 3 + - 3997.78 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 5056 + - - 2 + - 4053.86 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 686.243 + - 
- - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 1856 + - - 3 + - 4057.75 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 4288 + - - 3 + - 4109.55 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 4 + - - 6 + - 122.487 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 5888 + - - 3 + - 3991.21 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 128 + - - 5 + - 3906.41 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 2944 + - - 1 + - 4286.38 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 2368 + - - 3 + - 4145.31 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1408 + - - 3 + - 3961.42 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 3 + - 3018.28 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 448 + - - 5 + - 347.743 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 5888 + - - 3 + - 3945.17 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 448 + - - 5 + - 2614.85 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 64 + - - 5 + - 1230.48 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1024 + - - 1 + - 3550.41 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1408 + - - 0 + - 2967.53 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1408 + - - 3 + - 4170.01 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 128 + - - 0 + - 2247.88 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 4288 + - - 4 + - 4346.55 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 448 + - 1408 + - - 3 + - 2123.86 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 696.352 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5888 + - - 3 + - 2749.88 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 448 + - - 0 + - 669.201 + - - - 1408 + - 4 + 
- 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 4 + - - 6 + - 52.2966 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 795.382 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 4 + - 448 + - - 6 + - 14.8561 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3584 + - - 2 + - 4172.03 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 4288 + - - 3 + - 3968.91 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 4 + - - 6 + - 36.9126 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 704 + - - 0 + - 2050.29 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 704 + - - 3 + - 3498.86 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 4 + - 448 + - - 6 + - 18.5261 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 448 + - - 5 + - 861.912 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1408 + - - 5 + - 1045.36 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 704 + - - 6 + - 29.7186 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 6784 + - - 1 + - 4332.96 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 3 + - 2708.49 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 4 + - - 6 + - 66.6622 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 2944 + - - 0 + - 3742.3 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 64 + - - 5 + - 1491.88 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 6784 + - - 1 + - 4317.81 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 4 + - - 6 + - 11.2672 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 6784 + - - 1 + - 4111.36 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 704 + - - 3 + - 3985.35 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 64 + - - 5 + - 1046.04 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 4 + - - 7 + - 83.4965 + - - - 5056 + 
- 1024 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1024 + - - 4 + - 3399.45 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 3584 + - - 1 + - 3869.75 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 2368 + - - 3 + - 3919.78 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 704 + - - 3 + - 2251.05 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 128 + - - 5 + - 199.564 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 4288 + - - 0 + - 3788.4 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1856 + - - 0 + - 3742.99 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 128 + - 2368 + - - 5 + - 2251.59 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1856 + - - 0 + - 3686.3 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 64 + - - 0 + - 1818.98 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 64 + - 128 + - - 5 + - 59.2016 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 6784 + - - 4 + - 4172.14 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1024 + - - 2 + - 4165.04 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 2049.32 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 4 + - - 6 + - 19.5435 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 2368 + - - 3 + - 4015.31 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 1856 + - - 3 + - 3939.11 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1024 + - - 4 + - 2985.41 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 704 + - - 5 + - 2772.32 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 448 + - 4288 + - - 3 + - 3442.58 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1408 + - - 5 + - 1794.77 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 3584 + - - 1 + - 4084.55 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 
+ - 1408 + - 1408 + - 4 + - - 6 + - 51.0511 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1408 + - - 0 + - 3398.36 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 5888 + - - 1 + - 4179.61 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1024 + - - 2 + - 3301.45 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 3584 + - - 1 + - 3823.13 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 448 + - - 5 + - 3743.66 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 5056 + - - 0 + - 3987.33 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 5056 + - - 3 + - 3985.79 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 256 + - - 3 + - 3499.15 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1024 + - - 2 + - 3963.02 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 3584 + - - 0 + - 3843.44 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 704 + - 5888 + - - 3 + - 3834.02 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 6784 + - - 4 + - 4259.17 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 5056 + - - 3 + - 4112.46 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 4 + - - 6 + - 146.59 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 64 + - 2944 + - - 5 + - 1858.36 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 3584 + - - 1 + - 4114.91 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1024 + - - 3 + - 2943.69 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 5888 + - - 2 + - 4413.74 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 4 + - - 6 + - 83.8565 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 128 + - - 3 + - 2193.79 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 5056 + - - 1 + - 4255.61 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 
+ - 2944 + - 4288 + - - 4 + - 4085.74 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 6784 + - - 1 + - 4350.26 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 4288 + - - 3 + - 3955.83 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1408 + - - 5 + - 3746.6 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 256 + - - 5 + - 2264.66 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 704 + - - 3 + - 3247.55 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 4288 + - - 0 + - 4212.78 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 6784 + - - 3 + - 4072.95 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 5888 + - - 2 + - 4157.73 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 128 + - - 3 + - 2456.1 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 704 + - 64 + - - 5 + - 345.423 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1024 + - - 0 + - 954.555 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 4 + - 5888 + - - 6 + - 174.397 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 5888 + - - 5 + - 3187.19 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 2944 + - - 3 + - 3534.91 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 64 + - 256 + - - 5 + - 171.026 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 128 + - - 5 + - 1507.66 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1024 + - - 3 + - 3695.39 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 2157.43 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 2944 + - - 1 + - 4216.23 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 6784 + - - 1 + - 4359.85 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 128 + - - 0 + - 2817.72 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 2368 + - 
- 3 + - 4114.79 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1856 + - - 0 + - 3627.79 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 64 + - - 5 + - 3079.63 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 4 + - - 6 + - 69.1257 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 2944 + - - 5 + - 3779.01 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1856 + - - 5 + - 1554.43 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 6784 + - - 1 + - 4268.82 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 64 + - 4288 + - - 5 + - 1490.3 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1856 + - - 1 + - 4017.69 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1408 + - - 3 + - 3682.75 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 448 + - - 3 + - 3386.34 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1408 + - - 3 + - 3195.56 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 704 + - - 0 + - 3140.55 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 4288 + - - 4 + - 4285.06 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 5056 + - - 1 + - 4273.65 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1856 + - - 5 + - 3711.26 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 4 + - - 6 + - 2.86579 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 2944 + - - 2 + - 4122.76 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 448 + - - 3 + - 3642.0 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 4288 + - - 3 + - 4043.21 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 704 + - - 0 + - 3785.63 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 4 + - - 6 + - 29.3126 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 3584 + - - 0 + - 2541.32 + - - - 1856 + - 6784 + 
- 1 + - 768 + - 1856 + - 1856 + - 1856 + - 6784 + - - 1 + - 4239.29 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 5888 + - - 4 + - 4125.3 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 64 + - - 5 + - 2247.13 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 128 + - - 5 + - 1050.62 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 2944 + - - 3 + - 3832.33 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 128 + - - 5 + - 3255.81 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2543.53 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 2368 + - - 3 + - 3977.51 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 2368 + - - 3 + - 3470.98 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 4288 + - - 3 + - 4017.6 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1408 + - - 5 + - 3976.29 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 5888 + - - 1 + - 4280.99 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 2368 + - - 3 + - 4106.89 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 64 + - 2368 + - - 0 + - 1531.69 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 128 + - - 0 + - 398.133 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 6784 + - - 4 + - 4188.38 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1856 + - - 4 + - 4279.32 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 1856 + - - 3 + - 3845.33 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 2622.83 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 2368 + - - 5 + - 4199.02 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 64 + - - 5 + - 886.036 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 64 + - - 6 + - 2.94754 + - - - 2944 + - 4288 + - 1 + - 768 + - 
2944 + - 2944 + - 2944 + - 4288 + - - 4 + - 4241.8 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 6784 + - - 1 + - 4280.4 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1408 + - - 5 + - 1090.28 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1024 + - - 0 + - 1509.32 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 128 + - 5888 + - - 3 + - 2493.35 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 64 + - - 5 + - 2551.58 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1024 + - - 0 + - 682.324 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 6784 + - - 3 + - 3896.62 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 448 + - 3584 + - - 5 + - 3216.81 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 5056 + - - 3 + - 4103.68 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 448 + - - 0 + - 3908.97 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1856 + - - 0 + - 3414.84 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 704 + - - 3 + - 4058.86 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 448 + - - 0 + - 3268.86 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1408 + - - 3 + - 4002.72 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 190.71 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 448 + - 5056 + - - 3 + - 3357.35 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 448 + - - 5 + - 3338.97 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 128 + - 4288 + - - 0 + - 2480.52 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 128 + - - 0 + - 2918.04 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 448 + - 1024 + - - 5 + - 2301.92 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 3584 + - - 5 + - 3747.36 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 448 + - 
- 0 + - 3978.56 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 3 + - 2843.69 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 704 + - 4288 + - - 5 + - 3650.35 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 6784 + - - 1 + - 4427.56 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 2944 + - - 5 + - 3950.8 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 128 + - - 5 + - 2305.25 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 5888 + - - 3 + - 4180.56 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 3584 + - - 6 + - 123.765 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 448 + - 2368 + - - 0 + - 3094.47 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 64 + - - 5 + - 1975.32 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 704 + - - 3 + - 3103.64 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 11.594 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 5056 + - - 0 + - 3887.05 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 5056 + - - 3 + - 3991.07 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 64 + - 6784 + - - 0 + - 2242.84 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 6784 + - - 1 + - 4184.84 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 5888 + - - 4 + - 4389.36 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 2368 + - - 3 + - 3876.97 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 4288 + - - 1 + - 4226.88 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 5056 + - - 2 + - 4243.0 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 448 + - - 5 + - 2269.53 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 3584 + - - 1 + - 3876.57 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 1408 + - - 3 + - 3915.02 + - - - 128 + 
- 4 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 4 + - - 6 + - 5.69094 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 128 + - - 0 + - 3286.4 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1856 + - - 1 + - 4082.85 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 4 + - - 6 + - 79.0114 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 2368 + - - 3 + - 3926.34 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 2368 + - - 3 + - 4061.34 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 6784 + - - 2 + - 3967.47 +- null diff --git a/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml b/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml new file mode 100644 index 000000000..9fbec69f6 --- /dev/null +++ b/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml @@ -0,0 +1,11955 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + 
ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 8 + LSPA: 8 + LSPB: 64 + LVCA: 32 + LVCB: 4 + LVPA: 2 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 
1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x64x8_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + 
- 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 16 + LSPA: 8 + LSPB: 64 + LVCA: 32 + LVCB: 4 + LVPA: 2 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + 
NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + 
VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + 
NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + 
ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + 
MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x64x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 
4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + 
MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + 
SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + 
MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + 
StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: 
false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: 
Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + 
LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + 
SolutionIndex: 7 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 85.8659 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 6 + - 126.0 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4131.48 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4428.58 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 4 + - 2372.29 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 702.051 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 2207.44 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4346.21 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 175.395 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 4 + - 2084.25 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 3531.52 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3987.08 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 4.47573 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 6 + - 160.867 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4148.65 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 3974.74 + - - 
- 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 3529.36 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 11.3224 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 5 + - 3008.68 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4164.25 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1371.73 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 2639.09 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 116.897 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 4 + - 3241.07 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 2 + - 2702.65 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 1 + - 3799.9 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4458.37 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 4 + - 3455.76 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 4155.22 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 4 + - 1796.4 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4428.83 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4082.8 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 0 + - 3944.77 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 18.26 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4419.18 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 2263.71 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 11.1269 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 973.122 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 0 
+ - 3521.12 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 7 + - 66.6068 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 4 + - 1399.93 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3551.99 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3999.21 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3965.86 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4140.72 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 3463.37 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 599.676 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 6 + - 98.756 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4195.0 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4276.85 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 4 + - 3113.24 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 4 + - 2069.13 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4297.69 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4351.4 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4404.1 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 4 + - 2787.8 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 108.888 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4154.23 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 4 + - 3212.76 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 2 + - 2909.47 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3644.19 + - - - 4 + 
- 5056 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 134.921 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 3294.38 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2967.8 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 3715.59 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 5 + - 3532.34 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4228.72 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 1644.0 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 4111.2 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 2007.27 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 1839.47 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 17.7941 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4233.35 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 640.322 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 38.1032 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4339.85 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 133.74 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 5.31723 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 2846.54 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 3601.5 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 1 + - 4139.06 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 6 + - 112.043 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4209.45 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 
545.16 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 7 + - 0.129381 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 171.592 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4380.51 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 83.6644 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 3807.05 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 3971.62 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 0 + - 3989.46 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 4 + - 1828.11 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 4 + - 2152.29 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4420.97 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 4 + - 3792.89 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 0 + - 4345.66 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 18.1234 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 1237.32 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 3870.81 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 2 + - 2177.8 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 3253.82 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 311.788 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 3358.09 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4173.86 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 4 + - 3135.3 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 299.14 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + 
- 1408 + - 1408 + - 256 + - - 4 + - 1771.61 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 617.859 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4499.41 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 0 + - 3912.61 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4491.07 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 3361.78 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 6 + - 86.4953 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 3504.5 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 0 + - 3931.48 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 6 + - 83.6254 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 2 + - 3128.48 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 156.691 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4238.65 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 4376.43 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4330.46 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 2.5886 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4220.07 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 4 + - 3152.32 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 3465.0 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 4 + - 2224.62 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 2074.01 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 1193.48 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 
3328 + - - 4 + - 3252.91 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 1844.0 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 237.342 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 4 + - 2442.01 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4162.27 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 342.225 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 4 + - 323.901 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 3974.28 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 3420.33 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 66.3638 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 270.81 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 1308.95 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3960.37 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 3827.66 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 2 + - 2984.7 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 4045.85 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 2 + - 3159.54 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 4 + - 3337.75 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4438.26 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4371.87 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 117.712 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 65.2676 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 3983.44 + - - - 448 + - 2944 + - 1 + - 
3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3420.08 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 2003.53 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4290.62 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 486.923 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4212.23 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4368.14 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 2 + - 3616.37 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3612.48 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 2 + - 3591.67 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3478.54 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 177.026 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 6 + - 146.766 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 4 + - 1278.81 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 971.81 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 2 + - 2876.7 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 0 + - 4240.96 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4318.06 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 2 + - 2208.57 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 2917.28 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4238.0 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 2.8551 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 2581.76 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 
1408 + - 256 + - - 2 + - 3438.52 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 2855.58 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4304.2 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 6 + - 68.3931 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 3847.09 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 106.38 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 4 + - 3466.6 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 0 + - 3818.04 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 2706.07 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 4390.57 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 973.223 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 4 + - 2520.87 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 1 + - 4031.16 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4211.28 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 3917.47 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 1081.82 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4391.63 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 4 + - 1603.55 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 2 + - 3073.59 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1016.7 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4032.15 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 4 + - 2018.81 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 0 + 
- 3578.48 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 105.872 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 28.5936 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 4 + - 641.842 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4166.77 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 7 + - 152.668 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 3889.62 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 2909.64 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4240.33 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4398.42 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 2 + - 3127.64 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 2789.69 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 1472.72 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 4427.89 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 1746.49 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3335.98 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 4 + - 2491.91 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4286.95 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4513.2 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 3905.23 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 2501.33 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4320.44 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3847.15 + - - - 5888 + - 5056 + - 1 + - 
3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4450.1 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 1562.15 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 4078.36 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 813.39 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 10.5545 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 3404.04 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3878.26 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 3096.47 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 4 + - 2839.65 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 0 + - 3949.79 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 1 + - 3620.54 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4291.23 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 2 + - 2716.72 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3600.09 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4134.21 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4219.34 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 4 + - 3591.88 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 3883.36 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3562.83 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4303.51 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 1 + - 3964.3 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4132.39 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + 
- 4288 + - 1792 + - - 4 + - 3524.34 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 2 + - 3183.53 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 2 + - 2681.31 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 2744.04 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 4 + - 3700.79 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4237.23 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 4 + - 2671.88 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 4 + - 2392.8 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4301.81 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 2 + - 3587.41 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4287.93 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 1 + - 4062.15 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4230.32 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 3154.27 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4033.56 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4341.11 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4203.36 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 907.203 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 4 + - 1165.24 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3858.51 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3872.4 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 2312.38 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 
3584 + - 256 + - - 0 + - 3536.18 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 19.4596 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4407.57 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 4 + - 3548.1 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 4 + - 3538.51 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 0 + - 3876.59 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 4 + - 3620.31 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 37.2908 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 2522.63 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 2283.9 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 177.085 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4482.96 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3189.17 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 469.436 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4089.54 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 4 + - 3595.4 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 85.5961 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 4210.42 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3599.65 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 145.789 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 3864.67 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3047.55 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 4 + - 1392.8 + - - - 1856 + - 1856 
+ - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 1 + - 3840.63 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 0 + - 3890.05 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4019.7 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 0 + - 4200.22 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3626.32 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 113.139 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4208.82 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 4115.61 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4291.24 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 4 + - 1825.87 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 3803.13 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 4 + - 3713.96 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 466.587 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 941.001 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 122.644 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 2830.82 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4550.77 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 2 + - 2813.17 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3212.09 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 3659.11 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 4 + - 1117.38 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 5 + - 3850.82 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 
5056 + - 5056 + - 3328 + - - 0 + - 4293.64 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4372.66 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3314.5 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 65.7843 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 77.2831 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3472.0 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4484.4 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 42.0475 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 3521.99 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4305.4 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 39.5969 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 4 + - 3783.92 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 4220.54 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 3812.62 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 1925.91 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 26.4778 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 3581.57 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 69.3786 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 3875.64 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 2396.93 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 5 + - 3643.55 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3837.09 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 2930.26 + - - - 
1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 3981.74 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 4 + - 1500.98 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4406.67 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 1 + - 3964.6 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 153.951 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 2004.6 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 6 + - 39.0944 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 3591.41 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 3503.53 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 6 + - 65.2871 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 3556.53 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4335.45 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 3884.18 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 4 + - 3209.76 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 310.113 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4338.32 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 4 + - 1232.18 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 4 + - 458.427 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 855.55 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3777.0 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 4 + - 2296.02 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4170.19 + - - - 6784 + - 1856 + - 1 + 
- 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4382.03 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 37.6909 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 2 + - 3136.93 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3989.26 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4251.7 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4436.7 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 2 + - 3257.99 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 3273.65 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 5 + - 3925.06 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 5.57925 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4510.07 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 4092.01 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 3314.93 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4390.69 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 0 + - 3183.94 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 3650.6 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4221.88 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 4185.39 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 0 + - 3839.13 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 1635.92 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 1819.52 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 2847.72 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 
3584 + - 3328 + - - 4 + - 3528.36 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 5 + - 4034.28 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 0 + - 3942.86 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 4 + - 884.75 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3403.68 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 2 + - 3373.25 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4407.27 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 3791.92 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4439.62 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 707.811 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 3320.49 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 4 + - 2824.93 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 3306.71 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 4 + - 3386.86 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 2901.12 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 2365.11 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4220.64 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 1919.23 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 4 + - 2654.59 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 4099.85 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4235.16 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 6 + - 141.164 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + 
- - 4 + - 1561.99 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 6 + - 163.726 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 3243.82 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4262.05 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 620.839 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 6 + - 122.084 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 4146.4 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 3645.2 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 3092.71 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 972.701 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 4 + - 2004.99 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 940.27 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 2819.19 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 3158.57 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 2 + - 2422.91 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4352.68 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 1114.25 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 4 + - 3282.36 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 3516.01 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 3392.83 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 50.9029 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 323.95 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 2253.61 + - - - 1024 + - 128 + - 1 + - 
1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 1353.04 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 1929.22 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 2 + - 3587.43 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 0 + - 3835.87 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 706.515 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 3440.15 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3885.38 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 5 + - 3824.47 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 3726.59 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 2899.6 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 546.097 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 2810.3 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 4 + - 3308.83 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 1838.35 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 2844.89 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4436.46 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 413.849 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 3834.88 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 4 + - 2072.73 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 3355.64 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4172.09 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 2016.12 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 
1792 + - - 0 + - 4140.09 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4263.85 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 1175.69 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 2921.92 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 4 + - 2420.36 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4470.25 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 18.7769 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 0 + - 3584.48 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 2 + - 3157.79 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 2 + - 3116.27 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 2041.0 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 2004.82 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 2 + - 3368.5 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 2394.34 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3990.62 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4053.64 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 103.51 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 4 + - 2992.13 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 4.3018 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 0 + - 3655.24 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4355.33 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 1 + - 3743.87 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4279.05 + - - - 5056 + 
- 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4359.76 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4052.58 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 1 + - 3966.69 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 0 + - 3961.7 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 413.601 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 4 + - 3466.5 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 3298.18 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3834.83 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 2681.82 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 2293.28 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3383.62 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 3942.93 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 1504.24 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 4 + - 2005.1 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 2842.87 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 3944.01 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4505.84 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 4 + - 2598.79 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 4 + - 2849.46 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 3799.8 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 4 + - 3109.47 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 4 + - 1666.17 + - - - 5888 + - 128 + - 
1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 2 + - 2697.01 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 3757.73 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 88.8594 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 1755.18 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 6 + - 216.435 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 0 + - 4174.1 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 2673.84 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4413.93 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 4071.28 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 2915.75 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 3194.29 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4344.42 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 599.545 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 51.9619 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4358.44 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 75.0678 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 2456.82 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 3914.79 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 6 + - 210.043 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 355.184 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 1 + - 4222.24 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 3766.21 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 
128 + - 3328 + - - 4 + - 2309.9 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4375.64 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4400.81 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 3512.95 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4372.96 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 2 + - 3314.6 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 2788.15 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 2 + - 3470.94 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4224.05 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 426.706 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 4 + - 1212.98 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4383.27 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 4170.99 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 6 + - 20.853 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4219.89 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4305.85 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 2414.41 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 27.5612 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 3823.27 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 0.180014 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 4 + - 2709.42 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 6 + - 66.4912 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 26.8365 + - - - 64 + - 5888 + - 1 
+ - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 2846.36 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 486.132 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 2870.45 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4284.18 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 1237.36 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 161.971 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 473.754 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 14.7922 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4378.69 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 39.3219 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 2 + - 3374.36 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 3922.51 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 1359.35 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 4 + - 831.384 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 1 + - 4049.19 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 6 + - 51.5262 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 1623.91 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 2 + - 3128.25 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4088.11 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4351.11 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 2 + - 2813.9 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3337.32 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 4 + - 3357.67 + - 
- - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4431.33 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 67.3512 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 152.321 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 2349.08 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 3386.08 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4445.62 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 4382.58 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 0 + - 3199.33 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 2971.89 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 853.861 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4384.3 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3948.31 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 645.771 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 29.3082 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4428.83 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 2641.57 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 2 + - 2874.36 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 85.644 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 52.3054 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 3949.66 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 4 + - 3272.76 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 2981.91 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 448 + 
- 3328 + - - 4 + - 620.645 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 3675.33 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4272.82 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 2151.66 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3446.87 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 4081.81 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 4 + - 1806.81 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4348.63 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 6 + - 126.157 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 2 + - 3439.18 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 7 + - 65.8728 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 7 + - 168.352 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 0 + - 3955.31 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 2599.16 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 0 + - 3365.12 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4156.25 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 2183.88 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 0.16435 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 1817.93 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3986.34 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4467.96 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 3323.07 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4362.75 + - - - 64 + - 256 + 
- 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 167.985 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 3277.24 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4483.15 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 1 + - 3683.72 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 3648.54 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 3 + - 56.6186 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4538.21 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1808.61 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 51.385 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 2136.28 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 3367.09 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4466.18 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4267.7 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 2346.94 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 0 + - 3496.13 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 175.394 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 2106.71 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 3802.5 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 2.81138 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 0 + - 3893.42 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 2062.51 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4021.01 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 108.985 + - 
- - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 2997.83 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 3414.13 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 3535.97 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 37.1752 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 2 + - 3608.27 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 2 + - 3301.8 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 2 + - 3276.15 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 5.68895 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 236.913 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 685.472 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 2815.43 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 2 + - 3158.4 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4449.21 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 1194.04 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 201.767 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3995.15 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 4 + - 2110.15 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 77.2071 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 3346.02 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 102.376 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 4446.59 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 1272.63 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 
3328 + - - 0 + - 4447.08 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 2 + - 3590.81 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 3653.6 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 2 + - 2350.19 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3925.01 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 2841.71 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3496.59 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 3892.82 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 6 + - 66.4303 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 3841.0 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 3700.87 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 67.3682 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 3359.0 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4303.35 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 4 + - 2261.43 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3545.66 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 2917.28 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 2408.59 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 311.499 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 113.959 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 28.9247 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 2 + - 3122.59 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 4 + - 2270.31 + - - - 128 + - 4 + - 1 + - 
768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 5.19179 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 2878.7 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 4 + - 810.993 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 3406.1 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4303.8 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 88.8763 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 0 + - 4354.35 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3647.79 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 88.0468 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 1797.57 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 5 + - 3546.49 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 4 + - 2842.82 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2272.66 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1603.22 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4248.6 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 2 + - 3105.96 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 6 + - 158.977 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 1 + - 3789.53 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 6 + - 13.8983 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 1844.45 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4352.84 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4156.79 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 4 + - 1558.33 
+ - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 4201.32 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 4 + - 2526.34 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 6 + - 131.646 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 4164.88 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4187.25 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 3955.06 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 2 + - 2990.22 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 2 + - 2332.57 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 19.1452 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 2 + - 2036.99 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 1 + - 4131.84 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 2 + - 2340.12 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4059.02 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 1081.89 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4409.11 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 1 + - 4053.36 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 2125.25 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 829.328 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1199.94 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 2 + - 3186.05 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 3064.83 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 3658.24 + - - - 3584 + - 2368 + - 1 + - 
3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4318.46 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3774.09 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 1216.52 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 2450.68 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 2229.66 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 0 + - 3632.48 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 1278.57 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 3033.67 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4229.1 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3960.26 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 8.81501 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 1555.19 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 6 + - 187.576 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 4 + - 3593.47 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4309.56 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4241.55 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4438.11 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 0.174666 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 354.956 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 3946.94 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 5.61614 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 939.016 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 51.8841 + - - - 
128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2602.33 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 3935.01 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 11.1859 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 2 + - 3277.53 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 4 + - 1177.61 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 3337.25 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 2 + - 2596.29 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 3139.9 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 38.8583 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 4 + - 3334.39 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2106.64 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 1396.15 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 3808.46 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4268.92 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 5 + - 4099.11 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 0 + - 3782.42 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 0 + - 3928.11 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 0 + - 4421.71 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 6 + - 182.008 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4304.59 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4363.64 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 0 + - 3039.91 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 
128 + - 768 + - - 4 + - 856.058 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 4 + - 2103.1 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 3918.06 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 123.857 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4444.23 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 4 + - 2969.4 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 3903.79 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 4 + - 1693.52 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4175.34 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 3720.08 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 0 + - 4035.78 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 1228.64 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 11.0129 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 5 + - 3953.81 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 3985.78 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 1925.05 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 2 + - 3010.0 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 309.78 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 3735.58 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4027.83 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 3636.0 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 6 + - 93.6675 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 
2399.17 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 3423.39 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 3767.34 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 0 + - 2839.1 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 6 + - 193.705 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 4 + - 1630.78 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4522.67 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 6 + - 146.003 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 3335.1 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 4 + - 3345.53 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 1398.58 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 2315.01 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 3727.86 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4447.64 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 4193.48 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3535.31 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 1 + - 3783.23 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4293.49 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 4022.27 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 3177.71 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 2846.98 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3475.39 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 2 + - 2576.59 + - - - 
6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 3718.73 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4304.38 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 4318.24 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 10.3916 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 683.982 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4161.2 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4475.37 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 3254.98 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 0 + - 4534.9 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4294.38 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4213.48 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 2528.34 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4497.43 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 0 + - 3206.99 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 299.391 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 5.5019 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 6 + - 136.946 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4211.69 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4157.48 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 6 + - 78.2187 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4210.24 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 4 + - 2094.36 + - - - 3584 + - 3584 + - 1 + - 
768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4166.93 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 5 + - 3897.19 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 2736.65 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4272.96 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 6 + - 81.3897 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 1640.78 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 3594.0 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3111.99 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 1924.71 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 170.244 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 6 + - 167.88 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4174.21 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2483.92 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 4 + - 1625.03 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 4 + - 2454.36 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 8.53043 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 0 + - 4196.47 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 622.67 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3337.02 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 2414.36 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 3958.29 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4525.65 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + 
- 99.0835 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 3725.24 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 0 + - 4236.78 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 2 + - 2851.2 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 6 + - 65.8084 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 4 + - 622.464 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 4 + - 1368.6 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3636.78 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 0 + - 3329.6 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 1 + - 3788.13 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 5 + - 3390.79 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4287.42 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 2.16568 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 0 + - 3715.85 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 2090.83 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4215.1 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 81.9089 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 55.3903 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4159.21 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 3842.26 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 4 + - 2501.76 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 2 + - 2268.93 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4132.9 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 
+ - 2368 + - 3328 + - - 4 + - 2308.35 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4086.19 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 4012.17 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4404.48 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 0 + - 4455.05 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 0 + - 4354.7 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 2862.5 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 1230.09 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 1 + - 3902.67 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4478.32 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 4202.39 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 2.74515 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 2892.5 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 4 + - 2817.72 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 1681.35 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3544.68 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 1 + - 3731.44 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 2227.05 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 343.249 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4275.42 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 271.006 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 0 + - 3656.22 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 3691.99 + - 
- - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 0 + - 4290.75 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3922.54 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 3839.83 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 2 + - 3432.95 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4393.5 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 3817.28 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 0 + - 3971.4 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 0 + - 3899.05 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 470.339 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 27.9471 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 0 + - 3766.7 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 0 + - 3917.02 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4152.14 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 0 + - 3593.62 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 4 + - 2017.14 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 4 + - 2020.69 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 6 + - 2.80058 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 1 + - 4055.39 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4432.52 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 4 + - 2152.54 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 4 + - 2459.64 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 0 + - 3892.22 + - - - 2944 + - 2368 + - 1 + 
- 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 0 + - 3729.64 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 1910.26 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 0 + - 4154.37 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 52.7318 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 936.403 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 100.369 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 3453.74 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 1168.07 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 1 + - 4206.35 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4363.46 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4149.06 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 4 + - 3035.07 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 6 + - 117.699 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 2 + - 3160.31 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 4 + - 1996.14 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 0 + - 4131.38 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 3837.64 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 2.66246 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 4 + - 2814.43 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 4 + - 641.081 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 680.725 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 4501.36 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 
0 + - 4116.91 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 2 + - 3108.16 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 4 + - 2984.26 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 0 + - 3958.02 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 0 + - 3645.34 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 4 + - 2756.23 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 2914.11 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 0 + - 4387.15 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 4 + - 2732.26 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 4 + - 1024.58 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 1411.08 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4338.48 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 0 + - 3471.7 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 0 + - 3846.09 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 0 + - 4396.05 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 4 + - 2400.4 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 4 + - 3138.11 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 21.1136 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 2 + - 3439.41 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 4 + - 2729.96 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 2 + - 2796.96 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 3697.35 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 0 + - 3373.74 + - - - 
2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 0 + - 4211.32 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 4269.1 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 0 + - 4192.47 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 4 + - 2932.38 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 4 + - 3438.33 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 0 + - 4548.6 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 4 + - 3102.51 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 4 + - 2397.8 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 36.8767 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 1 + - 4029.1 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 3916.04 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 4 + - 1307.18 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 4 + - 3336.43 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 1407.1 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 4386.99 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 0 + - 4401.13 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 4 + - 3134.45 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 3216.63 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 1999.7 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 0 + - 3818.03 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 4 + - 1924.43 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 1 + - 3975.58 + - - - 1856 + 
- 704 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 2 + - 2854.58 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 0 + - 4321.86 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 2 + - 2709.33 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 2011.24 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 2 + - 3140.85 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 6 + - 27.7227 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 4 + - 2968.87 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4055.79 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 0 + - 3921.39 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 1772.15 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 6 + - 119.71 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 4 + - 425.978 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 4 + - 2732.52 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 4 + - 855.437 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 2 + - 3160.79 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4271.18 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 0 + - 4351.49 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 4 + - 3582.75 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 2 + - 2330.02 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 0 + - 4202.58 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4381.18 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 4 + - 2187.79 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 
704 + - 704 + - 768 + - - 6 + - 27.1515 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 4 + - 1835.59 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 4 + - 3805.24 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 4 + - 1477.3 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 0 + - 4424.26 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 2 + - 3441.37 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 6 + - 2.17143 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 3947.1 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 0 + - 4344.96 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 4 + - 1922.23 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 4 + - 204.405 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 0 + - 4346.81 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 0 + - 4192.06 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 5 + - 3864.22 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 53.1812 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 0 + - 3822.01 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 0 + - 3952.49 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 4 + - 2880.04 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 0 + - 4296.1 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 0 + - 3722.34 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 4 + - 44.113 +- null diff --git a/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml 
b/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml new file mode 100644 index 000000000..dbc90f8fe --- /dev/null +++ b/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml @@ -0,0 +1,11955 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: 
true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 
1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x32x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + 
GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + 
HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + 
GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 16 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + 
ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: 
ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 32 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + 
Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x128x8_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: 
false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + 
PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false 
+ DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 32 + LSPA: 16 + LSPB: 8 + LVCA: 16 + LVCB: 32 + LVPA: 16 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 
+ PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x32x16_SE_AMAS0_GRVW1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + 
CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + 
PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + 
CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + 
PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2944 + - - 1 + - 2154.74 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 4288 + - - 1 + - 3395.96 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 
4288 + - 1792 + - 2944 + - - 3 + - 4435.68 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 6784 + - - 3 + - 4355.31 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 3584 + - - 1 + - 3460.65 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 128 + - - 1 + - 563.38 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 64 + - - 0 + - 1047.26 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 448 + - - 1 + - 2796.91 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 64 + - - 0 + - 1789.11 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 5056 + - - 3 + - 4344.79 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1856 + - - 6 + - 66.4662 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 2944 + - - 3 + - 3632.79 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 256 + - - 3 + - 3683.52 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 448 + - - 4 + - 4079.75 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 256 + - 4 + - - 6 + - 21.32 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 6784 + - - 3 + - 4200.4 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 768 + - 2368 + - - 1 + - 2651.61 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 128 + - - 1 + - 2051.18 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 6784 + - - 3 + - 3262.44 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 2944 + - - 3 + - 4280.36 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 5056 + - - 3 + - 4263.55 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1024 + - - 3 + - 3688.25 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 768 + - 2368 + - - 1 + - 2050.12 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3584 + - - 4 + - 3622.95 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 448 + - - 4 + 
- 2802.9 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 64 + - - 0 + - 2268.1 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 128 + - - 1 + - 2796.16 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 3584 + - - 3 + - 3371.91 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 2368 + - - 3 + - 4182.54 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 5056 + - - 2 + - 3967.01 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 6784 + - - 3 + - 4529.68 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 128 + - - 1 + - 3294.07 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 5888 + - - 3 + - 4480.88 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 448 + - - 5 + - 283.064 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 5056 + - - 3 + - 4030.58 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 448 + - - 1 + - 2803.5 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 5888 + - - 3 + - 4316.92 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 704 + - - 2 + - 3809.33 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 448 + - - 1 + - 2430.17 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1024 + - - 0 + - 2632.78 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 4 + - - 7 + - 196.963 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 64 + - - 0 + - 1515.86 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1408 + - - 1 + - 3407.32 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 4 + - - 7 + - 108.621 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 5056 + - - 1 + - 2405.19 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 6784 + - - 3 + - 4201.43 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 704 + - - 5 + - 442.372 + - - - 1024 + - 
5056 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 5056 + - - 3 + - 3769.15 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 2944 + - - 3 + - 3841.79 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 128 + - - 1 + - 3201.65 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1408 + - - 1 + - 3268.26 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 5056 + - - 3 + - 4273.39 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 704 + - - 0 + - 2570.23 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 3584 + - - 3 + - 4159.05 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 768 + - 256 + - - 1 + - 1024.45 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 448 + - - 1 + - 2223.13 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 64 + - - 1 + - 807.878 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 6784 + - - 3 + - 4452.55 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 768 + - 5056 + - - 1 + - 3104.49 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 256 + - - 0 + - 2556.74 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1408 + - - 3 + - 3671.17 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 6784 + - - 3 + - 3805.38 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 64 + - - 1 + - 1642.21 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 256 + - 3584 + - - 6 + - 99.3833 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 3584 + - - 3 + - 3868.8 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 4 + - - 7 + - 83.3113 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 768 + - 1856 + - - 1 + - 2938.77 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 3584 + - - 3 + - 4203.01 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1024 + - - 3 + - 3052.73 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 
2944 + - 3328 + - 128 + - - 1 + - 2875.24 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 704 + - - 5 + - 453.438 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1856 + - - 3 + - 4139.24 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 2368 + - - 3 + - 4214.64 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 256 + - - 1 + - 1953.0 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 2368 + - - 1 + - 2253.96 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 4288 + - - 1 + - 2882.61 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 5056 + - - 3 + - 4357.58 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 5056 + - - 1 + - 3385.32 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 5888 + - - 3 + - 3988.22 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1408 + - - 1 + - 1139.91 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 768 + - 5888 + - - 1 + - 2489.62 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 448 + - - 0 + - 1116.51 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 5056 + - - 3 + - 3883.79 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 64 + - - 1 + - 2524.95 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 256 + - 6784 + - - 1 + - 2136.61 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 6784 + - - 3 + - 4405.78 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 256 + - 2944 + - - 3 + - 2845.48 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 5888 + - - 3 + - 4403.69 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 1856 + - - 3 + - 4191.92 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 2944 + - - 3 + - 4390.73 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 256 + - 64 + - - 5 + - 326.246 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1856 + - - 1 + 
- 1428.09 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 4 + - - 6 + - 29.8564 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 704 + - - 6 + - 29.2582 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 768 + - 4 + - - 6 + - 2.64714 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 6784 + - - 3 + - 4454.39 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 256 + - - 1 + - 2754.04 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 256 + - 64 + - - 5 + - 28.3993 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 448 + - - 0 + - 1154.0 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 6784 + - - 6 + - 217.039 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1856 + - - 1 + - 2305.79 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 5056 + - - 3 + - 4215.33 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 4 + - - 6 + - 5.61868 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1856 + - - 1 + - 805.999 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 5056 + - - 3 + - 4366.75 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 4 + - - 6 + - 5.69236 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 1408 + - - 0 + - 2556.93 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 4 + - - 6 + - 19.7227 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 256 + - 5888 + - - 6 + - 148.555 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 768 + - 2368 + - - 3 + - 3502.76 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 64 + - - 1 + - 1889.67 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 256 + - - 0 + - 1153.22 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 128 + - - 1 + - 1147.31 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 256 + - 4288 + - - 1 + - 1727.46 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 704 + - - 3 + - 
2999.57 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 768 + - 128 + - - 5 + - 300.95 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1024 + - - 3 + - 3791.56 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 4 + - - 6 + - 65.8957 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 2944 + - - 3 + - 4313.69 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 64 + - - 0 + - 1150.65 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 768 + - 5056 + - - 1 + - 2165.45 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 2944 + - - 1 + - 3278.5 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 5056 + - - 3 + - 4129.32 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 256 + - - 1 + - 2650.31 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1024 + - - 6 + - 37.7779 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 3584 + - - 1 + - 3273.25 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 2368 + - - 3 + - 3527.53 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 4288 + - - 3 + - 4149.18 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 64 + - - 1 + - 2478.11 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 768 + - 6784 + - - 3 + - 4196.32 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 256 + - 6784 + - - 1 + - 2424.86 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 64 + - - 0 + - 905.795 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 4 + - - 6 + - 67.2541 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 2368 + - - 3 + - 4152.86 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 1024 + - - 3 + - 3629.35 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 4288 + - - 3 + - 4342.31 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 5056 + - - 2 + - 4247.06 + - - - 4 + - 5888 + - 1 + 
- 1792 + - 4 + - 4 + - 1792 + - 5888 + - - 6 + - 184.597 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1856 + - - 0 + - 1191.56 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1408 + - - 1 + - 2202.64 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 2368 + - - 2 + - 3783.67 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 704 + - - 1 + - 3339.36 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 256 + - - 1 + - 1784.73 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1856 + - - 3 + - 4155.4 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 2944 + - - 3 + - 3368.85 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3584 + - - 3 + - 4316.78 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1856 + - - 3 + - 3973.93 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 5056 + - - 3 + - 4380.56 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 4288 + - - 3 + - 4148.0 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 3584 + - - 3 + - 4110.84 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1408 + - - 6 + - 53.895 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 128 + - - 1 + - 1764.36 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 128 + - - 1 + - 2220.66 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 256 + - 5056 + - - 1 + - 1633.92 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 704 + - - 3 + - 3611.57 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 768 + - 5888 + - - 6 + - 170.719 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1024 + - - 3 + - 3225.04 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1024 + - - 5 + - 457.694 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 768 + - 4288 + - - 1 + - 2057.12 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 4 + - - 7 + 
- 223.457 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 5888 + - - 3 + - 4250.39 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 128 + - - 0 + - 879.499 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 2368 + - - 3 + - 3937.39 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 4 + - - 6 + - 113.235 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 768 + - 6784 + - - 3 + - 3632.54 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 4288 + - - 3 + - 4313.24 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 64 + - - 0 + - 2163.14 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 3584 + - - 3 + - 3946.79 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 6784 + - - 3 + - 3947.63 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 64 + - - 0 + - 1873.98 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 1408 + - - 3 + - 4063.24 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 5888 + - - 3 + - 4438.31 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 5888 + - - 3 + - 3718.46 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 5888 + - - 6 + - 190.624 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 64 + - - 1 + - 3170.27 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 256 + - - 0 + - 2456.12 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 128 + - - 1 + - 3366.77 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1408 + - - 1 + - 2671.87 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 704 + - - 3 + - 3188.83 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 4 + - - 6 + - 11.4646 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 64 + - - 6 + - 2.82429 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 3584 + - - 3 + - 4280.85 + - - - 1408 + - 4 + 
- 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 4 + - - 7 + - 52.7304 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 704 + - - 4 + - 3360.57 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 5888 + - - 3 + - 3882.54 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 2944 + - - 3 + - 3645.67 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1856 + - - 3 + - 3918.49 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1024 + - - 3 + - 4171.13 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1408 + - - 1 + - 2632.03 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 4288 + - - 3 + - 4386.84 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 704 + - - 6 + - 26.0074 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 2944 + - - 3 + - 4366.27 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 2368 + - - 3 + - 4206.26 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 704 + - - 1 + - 3224.87 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1408 + - - 0 + - 905.46 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 128 + - - 0 + - 1312.42 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 256 + - 128 + - - 6 + - 4.46839 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 448 + - - 4 + - 3421.36 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 4288 + - - 3 + - 4161.56 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 3584 + - - 3 + - 4188.77 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 3584 + - - 0 + - 2058.72 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1024 + - - 0 + - 2831.34 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 6784 + - - 3 + - 4011.74 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 4 + - - 6 + - 2.8399 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + 
- 1792 + - 2944 + - - 1 + - 3386.7 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1856 + - - 3 + - 4075.24 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 6784 + - - 1 + - 3769.89 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 6784 + - - 1 + - 3287.92 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 256 + - - 0 + - 2245.04 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 448 + - - 0 + - 2319.18 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 256 + - - 6 + - 11.2366 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 64 + - - 5 + - 81.0254 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 2368 + - - 3 + - 4142.46 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 128 + - - 1 + - 1157.94 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 256 + - 704 + - - 1 + - 1667.69 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 1856 + - - 6 + - 68.0864 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 5056 + - - 3 + - 4399.76 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 256 + - 3584 + - - 1 + - 1347.79 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 3584 + - - 2 + - 3825.81 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 256 + - 4288 + - - 3 + - 3467.81 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3584 + - - 1 + - 3418.17 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 256 + - 4 + - - 6 + - 2.22489 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 6784 + - - 3 + - 4509.88 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 1856 + - - 3 + - 3814.77 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 768 + - 704 + - - 6 + - 27.5237 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1856 + - - 3 + - 4192.73 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 256 + - - 5 + - 161.14 + - - - 4288 + - 1856 + - 1 + 
- 768 + - 4288 + - 4288 + - 768 + - 1856 + - - 3 + - 3956.52 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 448 + - - 6 + - 18.1699 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1856 + - - 3 + - 4267.85 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 4288 + - - 3 + - 4357.6 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 2944 + - - 3 + - 4385.67 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 64 + - - 1 + - 2878.51 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 4288 + - - 3 + - 3966.55 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1856 + - - 3 + - 3308.7 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 704 + - - 1 + - 2620.62 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 256 + - 3584 + - - 3 + - 3432.35 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 768 + - 4288 + - - 6 + - 128.768 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 5888 + - - 3 + - 3368.33 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 64 + - - 5 + - 282.931 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 2944 + - - 3 + - 2877.95 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 704 + - - 1 + - 3410.53 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 5888 + - - 3 + - 4458.44 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1024 + - - 2 + - 3307.91 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 5888 + - - 1 + - 2883.0 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 2368 + - - 3 + - 4225.4 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1408 + - - 3 + - 4199.74 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 6784 + - - 1 + - 3327.96 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 5888 + - - 3 + - 4401.63 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 768 
+ - 4 + - - 7 + - 124.978 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 3584 + - - 3 + - 4393.06 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 704 + - - 0 + - 1721.69 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 704 + - - 0 + - 1793.65 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 256 + - 6784 + - - 3 + - 3040.5 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 3584 + - - 3 + - 4272.38 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1856 + - - 2 + - 3903.7 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 256 + - 704 + - - 1 + - 629.146 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 768 + - 2944 + - - 1 + - 2670.33 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 3584 + - - 3 + - 4352.16 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 2944 + - - 3 + - 4291.83 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 4 + - - 6 + - 0.181889 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 256 + - 3584 + - - 3 + - 3070.9 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1024 + - - 1 + - 1932.18 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 128 + - - 1 + - 2100.19 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 3584 + - - 2 + - 4045.95 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 5056 + - - 3 + - 3925.5 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 2368 + - - 1 + - 2791.14 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 2368 + - - 1 + - 3488.93 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 2368 + - - 3 + - 3659.21 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 2944 + - - 1 + - 3424.01 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 6784 + - - 3 + - 4288.98 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 704 + - - 0 + - 878.708 + - 
- - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 128 + - - 1 + - 2937.36 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 128 + - - 1 + - 3026.12 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1024 + - - 2 + - 3436.13 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 5888 + - - 1 + - 2773.74 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 256 + - 6784 + - - 6 + - 165.233 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 768 + - 448 + - - 1 + - 1712.88 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 768 + - 4 + - - 6 + - 0.162793 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 768 + - 128 + - - 5 + - 75.5218 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 448 + - - 4 + - 4021.56 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 4288 + - - 6 + - 142.555 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1856 + - - 0 + - 1149.13 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 5056 + - - 3 + - 4204.4 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 768 + - 3584 + - - 3 + - 3726.1 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1856 + - - 0 + - 2190.11 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 4 + - - 6 + - 29.0197 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1024 + - - 3 + - 4013.7 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 2368 + - - 3 + - 4340.68 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1408 + - - 1 + - 2736.93 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 1408 + - - 3 + - 3850.38 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 3584 + - - 3 + - 4344.8 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 256 + - - 1 + - 2024.05 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 5056 + - - 3 + - 4159.28 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + 
- 4 + - - 6 + - 65.3819 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 5888 + - - 3 + - 4019.57 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 6784 + - - 2 + - 3444.28 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 6784 + - - 3 + - 4364.07 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 448 + - - 5 + - 291.058 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 4288 + - - 3 + - 4339.01 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 1 + - 2126.49 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 256 + - 4 + - - 7 + - 0.128731 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 256 + - 5056 + - - 1 + - 1880.73 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 704 + - - 1 + - 2429.39 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 5056 + - - 2 + - 4006.44 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 704 + - - 3 + - 3701.68 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 3584 + - - 1 + - 2553.65 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 704 + - - 0 + - 2044.13 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 2944 + - - 3 + - 4345.89 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 704 + - - 4 + - 2876.54 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 5056 + - - 3 + - 4164.94 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 6784 + - - 3 + - 3831.27 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 704 + - - 2 + - 4035.03 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 4 + - - 7 + - 68.8263 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 5 + - 240.095 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 128 + - - 6 + - 5.67092 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 448 + - - 1 + - 2937.04 + - - - 256 + - 256 + 
- 1 + - 768 + - 256 + - 256 + - 768 + - 256 + - - 1 + - 591.71 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 704 + - - 3 + - 3574.11 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 2944 + - - 1 + - 3225.64 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 768 + - 128 + - - 6 + - 5.38123 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1856 + - - 1 + - 3839.58 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 768 + - 2368 + - - 0 + - 1313.72 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1024 + - - 4 + - 1993.81 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 768 + - 2944 + - - 1 + - 3168.14 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 256 + - - 3 + - 3871.85 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 4288 + - - 3 + - 3935.49 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 5056 + - - 6 + - 161.735 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 2368 + - - 6 + - 83.9317 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 768 + - 64 + - - 5 + - 36.7607 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 256 + - 5888 + - - 3 + - 3569.55 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 448 + - - 1 + - 3436.67 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 128 + - - 5 + - 579.833 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 4288 + - - 3 + - 4081.96 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 448 + - - 0 + - 1876.64 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 768 + - 3584 + - - 6 + - 113.916 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1856 + - - 1 + - 3468.52 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 2368 + - - 4 + - 3200.91 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 4288 + - - 3 + - 3757.2 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 3584 + - - 3 + - 
4462.71 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 768 + - 1024 + - - 0 + - 1148.01 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 2368 + - - 3 + - 4286.56 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 5056 + - - 3 + - 4019.88 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 256 + - - 3 + - 2874.91 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 704 + - - 3 + - 3642.1 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1408 + - - 3 + - 4126.68 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 4288 + - - 3 + - 4202.98 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 768 + - 1408 + - - 1 + - 2430.78 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 2944 + - - 0 + - 1866.99 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 704 + - - 3 + - 3763.87 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 256 + - - 3 + - 2905.69 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1024 + - - 2 + - 3822.56 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 768 + - 3584 + - - 3 + - 3431.96 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 4 + - - 7 + - 39.5375 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 5888 + - - 3 + - 4507.94 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1408 + - - 3 + - 3898.93 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 4 + - - 7 + - 170.756 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 4288 + - - 3 + - 3374.76 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1024 + - - 1 + - 2216.42 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 5888 + - - 3 + - 3930.65 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 4 + - - 7 + - 104.183 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 4288 + - - 3 + - 4125.72 + - - - 4288 + - 
256 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 3 + - 2160.26 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 256 + - 64 + - - 5 + - 60.2538 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 4288 + - - 3 + - 4027.28 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1408 + - - 3 + - 4378.95 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 704 + - - 1 + - 3286.15 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 6784 + - - 3 + - 4441.24 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 256 + - - 1 + - 2678.37 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 2944 + - - 1 + - 2942.25 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 768 + - 1408 + - - 0 + - 2341.96 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1408 + - - 2 + - 3788.99 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 4 + - - 6 + - 165.457 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 64 + - - 1 + - 2035.75 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 448 + - - 3 + - 3555.74 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 768 + - 448 + - - 1 + - 2130.93 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1024 + - - 2 + - 3852.56 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 128 + - - 0 + - 2379.48 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 448 + - - 1 + - 2311.36 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1024 + - - 3 + - 3391.1 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1856 + - - 3 + - 4096.69 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 768 + - 5056 + - - 1 + - 3324.43 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1024 + - - 3 + - 3658.76 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 5888 + - - 3 + - 3321.44 + - - - 4288 + - 6784 + - 1 + - 3328 
+ - 4288 + - 4288 + - 3328 + - 6784 + - - 3 + - 4481.65 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1856 + - - 2 + - 3841.78 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 128 + - - 0 + - 907.989 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 64 + - - 6 + - 2.86677 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1856 + - - 3 + - 4256.24 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1856 + - - 0 + - 2321.69 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 128 + - - 0 + - 2351.94 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 5888 + - - 3 + - 4275.32 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 6784 + - - 3 + - 4392.73 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 4288 + - - 3 + - 4299.86 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 3584 + - - 3 + - 3221.43 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3584 + - - 3 + - 3588.19 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 448 + - - 5 + - 562.969 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 4288 + - - 3 + - 4427.91 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 64 + - - 0 + - 1596.37 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 5888 + - - 3 + - 4218.99 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 5888 + - - 3 + - 4304.8 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 5888 + - - 3 + - 4437.87 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 6784 + - - 3 + - 4338.36 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1408 + - - 3 + - 3827.09 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 448 + - - 1 + - 3028.48 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 256 + - 64 + - - 6 + - 2.16149 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 
1024 + - - 0 + - 638.116 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 1 + - 1341.46 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1856 + - - 1 + - 3411.8 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1024 + - - 0 + - 2910.08 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 3584 + - - 3 + - 4178.57 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 256 + - - 5 + - 332.227 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 448 + - - 4 + - 2810.12 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 3584 + - - 6 + - 123.305 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 2944 + - - 3 + - 4444.42 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 1408 + - - 2 + - 3620.41 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 2944 + - - 3 + - 4076.08 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 64 + - - 1 + - 2116.94 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 6784 + - - 3 + - 4328.78 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 768 + - 4288 + - - 1 + - 1858.11 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 2944 + - - 3 + - 3991.41 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 2368 + - - 1 + - 3708.14 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 128 + - - 1 + - 2245.11 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1024 + - - 3 + - 2700.83 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 5888 + - - 3 + - 4276.37 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 2368 + - - 3 + - 3016.98 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1856 + - - 3 + - 3731.14 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 448 + - - 1 + - 2661.12 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 4 + - - 7 + - 85.9565 + 
- - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1408 + - - 1 + - 3733.82 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 5056 + - - 3 + - 4364.35 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 2368 + - - 1 + - 2735.93 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 128 + - - 5 + - 166.376 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 64 + - - 1 + - 1375.05 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 448 + - - 0 + - 1994.96 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 448 + - - 1 + - 3443.81 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 768 + - 2944 + - - 0 + - 1573.23 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 5888 + - - 3 + - 4441.27 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 128 + - - 0 + - 2617.79 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 448 + - - 1 + - 3156.3 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 6784 + - - 3 + - 4531.67 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 3 + - 2830.44 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 6784 + - - 4 + - 4117.82 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 3584 + - - 3 + - 4293.3 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1408 + - - 3 + - 3546.49 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 64 + - - 1 + - 2763.14 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 4288 + - - 3 + - 4133.48 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 4288 + - - 1 + - 2202.56 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 256 + - - 1 + - 3292.65 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 5056 + - - 1 + - 3501.38 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 128 + - - 0 + - 1720.96 + - - - 64 
+ - 4288 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 4288 + - - 1 + - 2042.56 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 64 + - - 5 + - 166.351 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 448 + - - 1 + - 3241.75 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1408 + - - 3 + - 4351.92 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3584 + - - 3 + - 4394.14 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 5888 + - - 3 + - 3308.3 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 2944 + - - 3 + - 4068.2 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 768 + - 4288 + - - 3 + - 4005.9 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 4 + - - 7 + - 136.649 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 256 + - - 3 + - 3829.56 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 448 + - - 1 + - 3166.23 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1856 + - - 1 + - 3624.69 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 1856 + - - 3 + - 4288.33 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 768 + - 64 + - - 5 + - 150.841 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 768 + - 448 + - - 5 + - 519.604 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 6 + - 8.79919 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 6784 + - - 3 + - 4298.42 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 6784 + - - 1 + - 3202.64 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 64 + - - 1 + - 1403.59 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 2944 + - - 3 + - 4116.11 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1408 + - - 3 + - 3711.2 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 4 + - - 6 + - 11.2377 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 768 + - 
704 + - - 5 + - 410.612 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 3584 + - - 3 + - 4387.93 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 5056 + - - 3 + - 4199.27 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1408 + - - 3 + - 3994.37 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1856 + - - 3 + - 3151.49 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 256 + - - 0 + - 1795.36 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 768 + - 4288 + - - 1 + - 3254.01 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 3 + - 3261.16 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 704 + - - 3 + - 3820.11 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 128 + - - 5 + - 162.165 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1856 + - - 1 + - 2355.49 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 448 + - - 5 + - 579.608 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 5056 + - - 3 + - 4326.41 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 5888 + - - 1 + - 2832.47 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 2944 + - - 3 + - 3752.01 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 64 + - - 1 + - 1853.75 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 704 + - - 0 + - 2894.85 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 5888 + - - 3 + - 3967.7 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 256 + - 2368 + - - 3 + - 3043.14 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 5888 + - - 3 + - 4472.33 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 768 + - 704 + - - 1 + - 1556.73 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3584 + - - 0 + - 2208.54 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1408 + - - 1 + - 1822.75 + - - 
- 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1408 + - - 1 + - 3222.35 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 4 + - - 6 + - 67.8188 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 4288 + - - 6 + - 137.86 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 256 + - 5056 + - - 6 + - 131.077 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 2944 + - - 6 + - 103.457 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 768 + - 1408 + - - 1 + - 1530.75 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 768 + - 5888 + - - 3 + - 3654.22 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 1408 + - - 3 + - 3917.14 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 1024 + - - 3 + - 3870.36 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 768 + - 256 + - - 5 + - 300.452 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 448 + - - 1 + - 3564.29 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1408 + - - 3 + - 3759.39 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 5056 + - - 3 + - 4285.16 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3584 + - - 3 + - 4206.14 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1408 + - - 3 + - 3819.55 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 6784 + - - 3 + - 4324.94 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 768 + - 704 + - - 1 + - 2135.64 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 5056 + - - 2 + - 4053.83 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 768 + - 2944 + - - 1 + - 3131.01 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 2944 + - - 1 + - 3257.82 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1856 + - - 3 + - 4110.16 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 128 + - - 1 + - 2858.72 + - - - 5056 + - 5888 + - 1 + - 256 + - 
5056 + - 5056 + - 256 + - 5888 + - - 3 + - 4275.95 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 256 + - 4288 + - - 1 + - 1406.59 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3584 + - - 6 + - 127.765 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 3584 + - - 3 + - 4345.22 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 768 + - 64 + - - 6 + - 2.65114 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 448 + - - 4 + - 3319.44 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 256 + - 4288 + - - 7 + - 117.968 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 64 + - - 5 + - 290.76 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 768 + - 4 + - - 6 + - 28.0045 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3584 + - - 3 + - 4403.41 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 64 + - - 5 + - 41.3845 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 256 + - - 1 + - 1119.3 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 768 + - 6784 + - - 1 + - 3021.96 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 448 + - - 1 + - 2768.48 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 2944 + - - 1 + - 2893.54 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 704 + - - 3 + - 3722.59 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1856 + - - 3 + - 3831.57 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 256 + - 1856 + - - 7 + - 51.5633 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 6784 + - - 3 + - 4494.2 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 4288 + - - 3 + - 4388.73 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1856 + - - 3 + - 3932.71 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 3584 + - - 3 + - 3716.55 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1856 + - - 6 + - 66.9334 + - - - 64 + - 2368 + - 1 + - 
3328 + - 64 + - 64 + - 3328 + - 2368 + - - 0 + - 1512.88 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 4 + - - 7 + - 87.2041 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 768 + - 4288 + - - 1 + - 2672.27 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 64 + - - 1 + - 2176.07 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 768 + - 4 + - - 6 + - 18.4202 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1856 + - - 3 + - 3773.76 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 2368 + - - 3 + - 4150.48 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 256 + - 2368 + - - 1 + - 2298.21 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 2944 + - - 3 + - 4395.25 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 448 + - - 1 + - 3502.67 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 768 + - 448 + - - 1 + - 1026.23 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 64 + - - 0 + - 1192.75 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 6784 + - - 3 + - 4457.05 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 1 + - 462.199 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 5056 + - - 3 + - 4343.29 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1024 + - - 3 + - 3181.8 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 2368 + - - 0 + - 1454.32 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1024 + - - 0 + - 2097.66 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1024 + - - 3 + - 3544.83 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 64 + - - 5 + - 443.72 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 256 + - 3584 + - - 1 + - 2193.89 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 128 + - - 1 + - 1884.75 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1408 + - - 
1 + - 3090.16 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 4 + - - 6 + - 2.79002 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 6784 + - - 3 + - 4277.7 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 5888 + - - 4 + - 3893.72 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 3584 + - - 3 + - 4350.85 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 128 + - - 1 + - 83.1338 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 704 + - - 4 + - 3919.43 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 64 + - - 1 + - 1177.29 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 0 + - 1829.26 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1024 + - - 1 + - 860.077 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 5056 + - - 3 + - 4298.08 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 2368 + - - 6 + - 86.665 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 768 + - 64 + - - 5 + - 262.711 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 768 + - 704 + - - 1 + - 810.047 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 2944 + - - 3 + - 3957.59 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 128 + - - 1 + - 2439.91 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 2368 + - - 3 + - 3796.22 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 4 + - - 7 + - 171.703 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1856 + - - 3 + - 4022.8 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 5056 + - - 2 + - 4356.06 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1408 + - - 0 + - 874.976 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1856 + - - 3 + - 3945.17 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1024 + - - 0 + - 658.675 + - - - 5888 + - 128 + - 1 + - 768 
+ - 5888 + - 5888 + - 768 + - 128 + - - 1 + - 2668.23 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1856 + - - 1 + - 3343.48 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 768 + - 3584 + - - 1 + - 2936.54 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1856 + - - 3 + - 3835.13 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3584 + - - 3 + - 4468.64 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 2944 + - - 6 + - 100.161 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 768 + - 1024 + - - 1 + - 2994.03 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 3584 + - - 3 + - 3860.0 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 256 + - - 5 + - 166.319 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 4288 + - - 3 + - 4320.23 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 2944 + - - 3 + - 4247.47 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 2944 + - - 2 + - 4252.54 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 6784 + - - 3 + - 4377.01 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 64 + - - 5 + - 640.287 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 768 + - 2368 + - - 0 + - 2243.37 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 448 + - - 3 + - 3483.07 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 256 + - 4288 + - - 3 + - 2916.79 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 3584 + - - 3 + - 3779.32 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 64 + - - 5 + - 588.133 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 5888 + - - 3 + - 4328.28 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1408 + - - 0 + - 1898.88 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 5888 + - - 3 + - 3826.4 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 256 
+ - 2944 + - - 3 + - 4227.63 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 5056 + - - 0 + - 2480.79 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 2944 + - - 2 + - 3975.22 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1856 + - - 4 + - 4057.56 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 768 + - 128 + - - 5 + - 519.375 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1024 + - - 2 + - 3962.33 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 64 + - - 1 + - 814.054 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 448 + - - 6 + - 19.4174 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1024 + - - 1 + - 1988.33 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 5056 + - - 3 + - 4421.63 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 2944 + - - 3 + - 4185.69 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 704 + - - 1 + - 1143.07 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 6784 + - - 3 + - 3525.45 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 4 + - - 7 + - 147.386 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 768 + - 4 + - - 6 + - 5.32911 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 4288 + - - 3 + - 3757.16 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 6784 + - - 3 + - 4523.58 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 5056 + - - 3 + - 4171.11 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 128 + - - 1 + - 2254.56 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 2538.43 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 2368 + - - 3 + - 3912.09 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 256 + - - 5 + - 323.388 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 256 + - - 1 + - 3485.72 + - - 
- 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 4288 + - - 3 + - 3929.0 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1408 + - - 1 + - 2787.95 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 128 + - - 0 + - 2244.3 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1024 + - - 0 + - 2396.86 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 2368 + - - 3 + - 3953.51 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1024 + - - 0 + - 2627.88 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 5056 + - - 3 + - 3717.74 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1856 + - - 1 + - 3142.24 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 2368 + - - 3 + - 3933.76 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 2944 + - - 1 + - 2790.8 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1408 + - - 3 + - 3307.07 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1856 + - - 3 + - 4151.1 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 2368 + - - 2 + - 3584.62 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 256 + - 5888 + - - 1 + - 2124.12 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 768 + - 448 + - - 5 + - 262.929 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 2368 + - - 3 + - 4188.53 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 6784 + - - 6 + - 210.086 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 448 + - - 4 + - 2939.18 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 128 + - - 1 + - 3058.55 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 4288 + - - 3 + - 4275.42 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 4288 + - - 3 + - 3787.32 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 5888 + - - 3 + - 4190.97 + - - - 2368 + - 64 + - 1 + - 
1792 + - 2368 + - 2368 + - 1792 + - 64 + - - 0 + - 1458.48 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 2944 + - - 3 + - 4432.94 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 704 + - - 1 + - 2579.92 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 768 + - 128 + - - 5 + - 151.353 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 6784 + - - 3 + - 3863.1 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 4288 + - - 3 + - 4337.39 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 768 + - 5888 + - - 1 + - 2668.49 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 256 + - 2368 + - - 1 + - 1547.44 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 2368 + - - 3 + - 3829.39 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 2368 + - - 2 + - 3727.92 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 5888 + - - 3 + - 4491.96 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1408 + - - 0 + - 1713.46 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 704 + - - 1 + - 2741.28 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 704 + - - 1 + - 3290.97 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 6784 + - - 3 + - 4281.9 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 256 + - 704 + - - 6 + - 20.9726 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 256 + - - 1 + - 3034.19 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 64 + - - 1 + - 2130.71 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1024 + - - 4 + - 3574.77 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 768 + - 64 + - - 5 + - 75.3625 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 704 + - - 1 + - 2115.46 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1024 + - - 3 + - 3061.58 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 256 + 
- 5056 + - - 3 + - 3957.03 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 256 + - - 3 + - 3198.62 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 64 + - - 5 + - 454.192 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 256 + - 4 + - - 6 + - 4.40748 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 4 + - - 7 + - 153.371 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 128 + - - 0 + - 2554.01 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 768 + - 5056 + - - 6 + - 149.939 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 704 + - - 4 + - 3338.07 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 704 + - - 0 + - 906.525 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1408 + - - 6 + - 50.5587 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 5888 + - - 3 + - 4391.69 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 448 + - - 1 + - 3469.17 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 256 + - 5056 + - - 3 + - 2998.05 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 256 + - 704 + - - 5 + - 326.05 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1408 + - - 3 + - 3846.83 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 6784 + - - 3 + - 3914.34 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 4288 + - - 3 + - 4135.85 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 256 + - 1408 + - - 6 + - 39.3504 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1024 + - - 0 + - 2563.4 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 2944 + - - 3 + - 4435.01 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 64 + - - 0 + - 1315.78 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 6784 + - - 3 + - 4473.26 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 768 + - 5888 + - - 3 + - 3890.44 + - - - 2944 + - 1024 + - 1 
+ - 256 + - 2944 + - 2944 + - 256 + - 1024 + - - 2 + - 3016.04 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 5056 + - - 3 + - 3962.72 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 128 + - - 5 + - 322.658 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 448 + - - 0 + - 1912.01 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 2368 + - - 3 + - 4017.84 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 5056 + - - 3 + - 3390.77 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 1024 + - - 4 + - 3703.29 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 120.785 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 4288 + - - 3 + - 3948.44 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 2368 + - - 1 + - 3792.34 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3584 + - - 2 + - 4387.38 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 5888 + - - 1 + - 3643.62 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 64 + - - 1 + - 3299.67 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 1856 + - - 3 + - 3588.19 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 5888 + - - 3 + - 4078.45 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 448 + - - 4 + - 3371.57 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 2944 + - - 3 + - 4360.64 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 4288 + - - 3 + - 4392.06 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1408 + - - 3 + - 4222.71 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 128 + - - 1 + - 2335.25 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 4 + - - 7 + - 69.5323 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 448 + - - 1 + - 2604.29 + - - - 256 + - 1024 + - 1 + - 768 + - 
256 + - 256 + - 768 + - 1024 + - - 1 + - 1777.67 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 2368 + - - 3 + - 3944.55 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 2368 + - - 3 + - 3717.36 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 128 + - - 1 + - 2000.46 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3584 + - - 2 + - 4134.9 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 256 + - 704 + - - 1 + - 1607.26 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 128 + - - 0 + - 1794.73 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 4288 + - - 3 + - 3891.31 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1024 + - - 6 + - 37.5085 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 5888 + - - 3 + - 4452.59 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1408 + - - 0 + - 1787.18 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 5888 + - - 3 + - 4399.47 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 2368 + - - 3 + - 4136.05 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 256 + - - 3 + - 3369.85 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 5888 + - - 1 + - 2940.16 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 2368 + - - 3 + - 4231.33 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 4288 + - - 3 + - 4028.84 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 5056 + - - 3 + - 4216.8 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 704 + - - 4 + - 3892.0 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 4 + - - 7 + - 38.3811 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1856 + - - 0 + - 1040.26 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 2944 + - - 1 + - 3366.31 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 256 
+ - 128 + - - 1 + - 2145.79 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 4 + - - 7 + - 102.605 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 768 + - 128 + - - 1 + - 810.35 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 4 + - - 6 + - 18.9098 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 6784 + - - 3 + - 4352.76 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1024 + - - 2 + - 4065.99 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 4 + - - 7 + - 77.9339 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 3584 + - - 3 + - 4095.15 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1408 + - - 1 + - 622.088 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 2368 + - - 0 + - 2457.6 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1408 + - - 1 + - 2750.56 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 256 + - - 1 + - 2935.6 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1408 + - - 3 + - 3960.42 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4288 + - - 1 + - 2239.41 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 2944 + - - 1 + - 3643.5 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1856 + - - 1 + - 3158.62 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 768 + - 2368 + - - 6 + - 79.264 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 5888 + - - 3 + - 4031.4 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 4 + - - 6 + - 130.742 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 256 + - 448 + - - 5 + - 409.783 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 4288 + - - 3 + - 4343.32 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 6784 + - - 3 + - 4176.74 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 2944 + - - 1 + - 2866.03 + - - - 5056 + - 
1408 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 1408 + - - 3 + - 3994.72 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 5056 + - - 0 + - 2027.3 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1024 + - - 0 + - 1307.58 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5888 + - - 3 + - 2800.1 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1408 + - - 3 + - 4045.44 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 5056 + - - 3 + - 4350.88 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 256 + - 2368 + - - 6 + - 66.1994 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 5888 + - - 3 + - 4429.75 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 704 + - - 1 + - 2347.83 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 4 + - - 7 + - 122.606 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 128 + - - 1 + - 3461.28 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1408 + - - 3 + - 3862.9 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 6784 + - - 3 + - 4314.95 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 1 + - 1820.64 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5056 + - - 1 + - 2554.51 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 256 + - 128 + - - 5 + - 121.72 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 128 + - - 1 + - 2526.01 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1856 + - - 3 + - 3500.14 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 768 + - 2944 + - - 6 + - 94.8458 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 1024 + - - 6 + - 36.9641 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 5888 + - - 3 + - 4039.62 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1024 + - - 2 + - 3926.58 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 
448 + - - 1 + - 3360.46 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 448 + - - 1 + - 3478.69 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 5056 + - - 3 + - 4168.09 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1408 + - - 0 + - 2497.16 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1024 + - - 1 + - 1348.94 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1024 + - - 0 + - 1267.05 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 256 + - 2944 + - - 1 + - 1897.6 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 256 + - - 3 + - 3324.55 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 128 + - - 1 + - 1431.49 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 256 + - 64 + - - 5 + - 209.508 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1024 + - - 2 + - 3402.08 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 4288 + - - 3 + - 4204.7 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 704 + - - 1 + - 3430.74 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 4288 + - - 3 + - 4275.31 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 256 + - - 0 + - 2715.65 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 4288 + - - 1 + - 2118.98 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 768 + - 3584 + - - 1 + - 3201.68 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1024 + - - 4 + - 3678.2 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 704 + - - 1 + - 2198.16 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 768 + - 704 + - - 1 + - 2032.08 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 5056 + - - 6 + - 167.361 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 3584 + - - 3 + - 4009.87 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 3584 + - - 3 + - 3550.13 + - - - 
4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 4 + - - 6 + - 93.1657 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 64 + - - 1 + - 625.778 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 768 + - 256 + - - 5 + - 150.85 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 768 + - 6784 + - - 1 + - 2876.53 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 128 + - - 0 + - 2172.08 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 5888 + - - 3 + - 4365.81 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 704 + - - 1 + - 3414.8 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 5056 + - - 3 + - 4415.58 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 1 + - 2364.45 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 2368 + - - 1 + - 2334.79 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1856 + - - 3 + - 3915.17 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 5 + - 121.476 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1856 + - - 3 + - 3821.16 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 4 + - - 7 + - 110.438 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 256 + - 448 + - - 6 + - 14.6836 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 768 + - 5056 + - - 0 + - 2318.79 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 2368 + - - 3 + - 4253.26 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1408 + - - 3 + - 3893.27 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 704 + - - 2 + - 3972.1 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 3584 + - - 3 + - 4183.15 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 1408 + - - 3 + - 3374.27 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 1024 + - - 3 + - 3582.47 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 256 
+ - 1024 + - - 6 + - 28.1635 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1856 + - - 2 + - 3685.44 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 768 + - 2944 + - - 1 + - 2521.2 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 64 + - - 5 + - 457.361 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 2944 + - - 1 + - 3446.67 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 704 + - - 3 + - 3157.7 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 2368 + - - 3 + - 3922.4 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 448 + - - 3 + - 3285.84 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 448 + - - 0 + - 2552.36 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 256 + - 448 + - - 1 + - 1607.61 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 2368 + - - 3 + - 3584.07 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 4 + - - 6 + - 112.526 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 256 + - - 3 + - 2789.89 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 128 + - - 5 + - 241.237 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1024 + - - 3 + - 4244.32 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1408 + - - 3 + - 3673.84 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 704 + - - 1 + - 3131.21 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 4288 + - - 3 + - 4299.61 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 4 + - - 6 + - 54.0926 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1408 + - - 3 + - 4009.11 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 256 + - 2368 + - - 1 + - 995.008 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 256 + - 2944 + - - 6 + - 82.0988 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 6784 + - - 3 + - 4500.49 + - - - 1408 + - 
1408 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1408 + - - 3 + - 2733.34 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 2368 + - - 3 + - 4265.14 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 1 + - 785.758 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1024 + - - 2 + - 4140.24 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 5888 + - - 3 + - 4052.4 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 6784 + - - 3 + - 4216.63 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 5056 + - - 1 + - 3308.61 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 4 + - - 7 + - 65.9487 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 768 + - 256 + - - 6 + - 10.6099 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 4 + - - 6 + - 0.175665 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 6784 + - - 3 + - 4508.17 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 448 + - - 4 + - 3847.66 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3584 + - - 1 + - 3566.32 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 256 + - - 1 + - 2856.33 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 768 + - 5056 + - - 2 + - 3796.24 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 6784 + - - 3 + - 4471.32 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 3584 + - - 3 + - 3822.56 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 4288 + - - 3 + - 3517.63 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 256 + - 4 + - - 6 + - 14.8355 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 5888 + - - 3 + - 4233.28 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 6784 + - - 3 + - 4521.13 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 4288 + - - 1 + - 2150.33 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 
1792 + - 4288 + - - 1 + - 2825.53 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3584 + - - 3 + - 4209.29 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 2944 + - - 3 + - 4400.3 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 3584 + - - 3 + - 4403.99 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1408 + - - 3 + - 3640.71 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 768 + - 4 + - - 6 + - 10.6451 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 6784 + - - 1 + - 3379.92 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 128 + - - 0 + - 1265.85 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 4 + - - 6 + - 28.0971 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 2368 + - - 3 + - 4151.86 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 4 + - - 7 + - 88.5794 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1856 + - - 3 + - 4097.83 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1856 + - - 1 + - 2585.67 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 5056 + - - 3 + - 3928.11 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 5056 + - - 1 + - 3569.57 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 704 + - - 3 + - 2734.12 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1856 + - - 3 + - 4173.45 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 704 + - - 1 + - 3141.82 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 1856 + - - 1 + - 3241.0 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 64 + - - 1 + - 992.157 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 256 + - 5888 + - - 1 + - 1851.0 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 256 + - 2944 + - - 1 + - 1177.91 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 64 + - - 0 + - 1901.56 + - - 
- 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 6784 + - - 2 + - 3392.09 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1024 + - - 2 + - 3503.26 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 128 + - - 5 + - 81.121 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 128 + - - 1 + - 1543.66 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 5056 + - - 3 + - 4296.26 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 448 + - - 1 + - 3362.71 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1408 + - - 3 + - 4292.51 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1024 + - - 4 + - 3596.07 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 3584 + - - 3 + - 3841.89 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 768 + - 64 + - - 5 + - 411.106 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 768 + - 1856 + - - 1 + - 1928.73 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 2944 + - - 3 + - 3909.92 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 256 + - - 0 + - 2398.7 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 5056 + - - 3 + - 4365.58 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 128 + - - 5 + - 332.335 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 2368 + - - 3 + - 3861.85 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 768 + - 3584 + - - 0 + - 1809.28 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 256 + - 5056 + - - 3 + - 3416.57 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 256 + - 6784 + - - 3 + - 3932.03 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1856 + - - 3 + - 4231.93 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 256 + - 128 + - - 5 + - 409.052 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1856 + - - 3 + - 4117.65 + - - - 1856 + - 256 + - 1 + - 3328 
+ - 1856 + - 1856 + - 3328 + - 256 + - - 1 + - 3617.52 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 768 + - 1856 + - - 1 + - 3144.43 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 768 + - 448 + - - 6 + - 18.1636 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 4288 + - - 3 + - 4207.4 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 1 + - 1145.19 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 256 + - - 1 + - 2422.28 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 1856 + - - 3 + - 4044.97 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 6784 + - - 3 + - 4384.84 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 704 + - - 0 + - 2803.55 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 4288 + - - 1 + - 3677.55 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 4 + - - 6 + - 39.5061 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 5888 + - - 2 + - 4163.12 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 704 + - - 3 + - 3482.29 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 768 + - 6784 + - - 6 + - 193.206 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 256 + - - 1 + - 3395.77 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1408 + - - 0 + - 800.749 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 448 + - - 1 + - 3295.06 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 128 + - - 6 + - 5.72624 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 256 + - - 1 + - 643.054 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1024 + - - 4 + - 3307.55 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1856 + - - 3 + - 3282.0 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 2368 + - - 3 + - 4270.52 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1408 + - - 1 + - 
2767.25 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 256 + - 2944 + - - 1 + - 2606.98 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 256 + - 5888 + - - 3 + - 3446.58 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 4 + - - 6 + - 39.9493 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4 + - - 6 + - 8.77248 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1024 + - - 4 + - 3119.75 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 5056 + - - 2 + - 4032.02 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 64 + - - 1 + - 39.961 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 2944 + - - 3 + - 4238.23 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 256 + - - 0 + - 2775.93 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 704 + - - 1 + - 2149.6 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 256 + - 448 + - - 5 + - 210.534 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 5888 + - - 3 + - 4055.65 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 128 + - - 1 + - 873.935 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 64 + - - 1 + - 2872.57 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 6784 + - - 3 + - 4483.32 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 2944 + - - 3 + - 4168.08 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 256 + - 128 + - - 1 + - 626.594 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 448 + - - 1 + - 3491.63 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 128 + - - 1 + - 1556.73 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 1 + - 2299.97 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 64 + - - 0 + - 876.647 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 64 + - - 5 + - 162.065 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 
+ - 2368 + - 1792 + - 1408 + - - 2 + - 3741.83 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 4 + - - 7 + - 67.6235 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1024 + - - 4 + - 3501.02 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 768 + - 6784 + - - 1 + - 3267.87 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 2944 + - - 3 + - 4145.54 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 5888 + - - 3 + - 3691.65 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 5888 + - - 3 + - 4174.5 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 256 + - - 0 + - 661.359 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 1024 + - - 4 + - 3596.78 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2368 + - - 0 + - 1826.5 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 704 + - - 3 + - 3672.47 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 64 + - - 0 + - 657.616 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 2368 + - - 3 + - 4333.14 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 128 + - - 0 + - 1934.13 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 256 + - - 1 + - 3146.6 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 4288 + - - 3 + - 3830.79 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 64 + - - 1 + - 2395.97 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 4288 + - - 3 + - 3796.72 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 1024 + - - 1 + - 3366.99 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 5056 + - - 0 + - 2579.78 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 1408 + - - 6 + - 51.6518 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 4288 + - - 3 + - 4303.75 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 64 
+ - - 1 + - 83.2651 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 256 + - - 6 + - 11.3623 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1408 + - - 3 + - 3555.33 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 4 + - - 7 + - 53.5578 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 4288 + - - 1 + - 3437.27 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 704 + - - 4 + - 3809.03 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 4288 + - - 3 + - 4090.86 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1024 + - - 5 + - 589.015 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 2944 + - - 3 + - 4349.15 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3584 + - - 1 + - 3384.32 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 448 + - - 0 + - 2488.74 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 2368 + - - 0 + - 2397.18 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 448 + - - 1 + - 2344.82 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 2944 + - - 0 + - 1780.56 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 2944 + - - 3 + - 4267.95 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 3584 + - - 3 + - 4227.78 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 768 + - 5888 + - - 3 + - 3191.33 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 256 + - - 0 + - 1723.41 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3584 + - - 3 + - 4307.98 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1024 + - - 3 + - 3294.33 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 5888 + - - 3 + - 4126.79 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 448 + - - 1 + - 2346.21 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 768 + - 256 + - - 1 + - 1557.66 + - - - 1408 + 
- 704 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 704 + - - 1 + - 2782.66 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 4 + - - 6 + - 53.2666 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 2368 + - - 3 + - 3829.36 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1408 + - - 1 + - 3651.59 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1024 + - - 1 + - 3223.15 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 2368 + - - 2 + - 3969.34 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1856 + - - 3 + - 3811.57 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 256 + - 448 + - - 1 + - 1241.79 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 448 + - - 1 + - 3315.74 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 256 + - 128 + - - 5 + - 60.2908 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 2368 + - - 3 + - 4255.72 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 448 + - - 1 + - 789.93 +- null diff --git a/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml b/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml new file mode 100644 index 000000000..a63116aa8 --- /dev/null +++ b/HostLibraryTests/configs/lite_configs/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml @@ -0,0 +1,12161 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + 
IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: 
false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + 
SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 64 + LVCA: 8 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + 
LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + 
ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + 
LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + 
ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x32_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 
6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + 
UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + 
LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + 
TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x128x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 32 + LVCA: 4 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 
8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + 
Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x32x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 
16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + 
SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + 
LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] 
+ SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: 
Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + 
SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 8 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 6 + - 2954.59 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 4 + - 4025.85 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 116.076 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 1 + - 845.171 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 1972.31 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 5 + - 2480.72 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 59.9816 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4257.57 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 3 + - 3289.8 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3303.91 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 5 + - 1484.0 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 
5888 + - 768 + - 768 + - - 0 + - 3705.47 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 1238.89 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 5 + - 2209.44 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 3 + - 4001.8 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 7 + - 13.0749 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 4 + - 3907.7 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 74.4445 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 3 + - 4282.36 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 8 + - 120.803 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 4 + - 3782.03 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 2976.19 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3847.68 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 4112.42 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 6 + - 3046.15 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 2 + - 449.449 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 62.3904 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 7 + - 3.39824 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 6 + - 2200.75 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 3516.69 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4032.95 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 0 + - 3915.86 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 3413.62 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 5 + 
- 2585.53 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 5 + - 2676.32 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 6 + - 2610.68 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 5 + - 2760.48 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 7 + - 104.231 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 47.383 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 4 + - 3924.37 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 1289.67 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 3 + - 4057.1 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 3 + - 3225.34 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 0 + - 3503.28 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 4 + - 3301.1 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 0 + - 3759.95 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 4 + - 3445.79 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 4 + - 3442.49 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 6 + - 2882.31 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 4 + - 3759.15 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 2018.01 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 8 + - 219.812 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 0 + - 3566.71 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 3912.43 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 6 + - 2935.45 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 0 + - 3457.56 + - - - 704 + - 
256 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 1594.49 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 5 + - 2992.89 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 0 + - 3768.5 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 197.778 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 5 + - 2634.93 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 3 + - 3751.81 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 5 + - 2059.72 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 3 + - 4168.66 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 4 + - 3866.16 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 2 + - 153.45 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 3 + - 4119.58 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 3268.41 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 5 + - 1929.12 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 4 + - 3553.24 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 6 + - 2971.75 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 0 + - 3894.12 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 6 + - 2896.24 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 5 + - 1313.5 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 5 + - 1682.69 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 1 + - 1860.07 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 2829.95 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 7 + - 85.9574 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 
5888 + - 256 + - 256 + - - 5 + - 1724.63 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 4 + - 3608.87 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 2951.84 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 4 + - 3544.32 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 0 + - 3394.21 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 6 + - 2647.22 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 5 + - 2117.2 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 3077.93 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 0 + - 3537.99 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 2.47794 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 3350.62 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 6 + - 2769.06 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 2611.65 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 0 + - 3931.4 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 0 + - 3628.16 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 3.34032 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 1656.91 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 1 + - 2845.71 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 45.7854 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 0 + - 3748.16 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4145.64 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 5 + - 1867.3 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 0 + - 3791.39 + 
- - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 2 + - 504.215 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 3949.4 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 4 + - 3507.09 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 0.189148 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 0 + - 3491.21 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 3 + - 3243.14 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 3055.67 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 3974.1 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 6 + - 2313.73 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 2892.91 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 0 + - 3394.58 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 6 + - 3161.19 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 94.5694 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 4 + - 3700.44 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 7 + - 47.3194 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 3 + - 4032.43 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 614.494 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 4 + - 3945.16 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 4 + - 3369.2 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 3002.56 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 2 + - 199.873 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 4 + - 3803.42 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 
256 + - 1792 + - 1792 + - - 5 + - 2333.84 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 3 + - 4137.48 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 3 + - 3794.16 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 137.801 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 3308.23 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 3306.04 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 2 + - 379.582 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 47.0106 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 0 + - 3572.96 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 5 + - 1920.96 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3979.16 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 4245.44 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 4 + - 3591.76 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3685.82 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 3 + - 4128.27 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 3899.64 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 185.705 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 1 + - 1542.23 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 2016.49 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 6 + - 3361.14 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 5 + - 1730.08 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 3 + - 3968.13 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 2 + - 1539.55 
+ - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 3928.83 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 5 + - 1477.08 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 4 + - 3802.97 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 3 + - 4251.2 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 7 + - 3.29931 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3234.49 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 399.61 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 3310.51 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 1 + - 1127.07 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 1229.4 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 5 + - 2483.92 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 4 + - 3449.25 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 44.6838 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 3 + - 3532.17 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 0 + - 3602.91 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 2 + - 557.951 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 2082.54 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 5 + - 2898.46 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3850.44 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 7 + - 56.5909 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 3 + - 3687.44 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 4 + - 3784.63 + - - - 448 + - 2368 + - 1 + - 256 + - 
448 + - 448 + - 256 + - 256 + - - 6 + - 2202.49 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 3 + - 3929.59 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 6 + - 2959.0 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 2 + - 1213.31 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 3777.43 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 0 + - 3763.48 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 6 + - 3171.29 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 5 + - 1415.27 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 4 + - 4063.84 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 1867.92 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 4 + - 2891.71 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 4202.4 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 2 + - 225.483 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 5 + - 1394.04 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 0 + - 3333.63 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 2 + - 258.161 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 3 + - 3878.62 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 0 + - 3495.89 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 3 + - 3232.17 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 1211.2 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 5 + - 1864.66 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 889.455 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - 
- 5 + - 2540.22 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 2 + - 1213.26 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 3 + - 3415.1 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 1 + - 1897.22 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 3978.16 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 3 + - 3401.08 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 3 + - 3971.91 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 3864.17 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 2 + - 1451.96 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 6 + - 2650.71 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 2 + - 99.9024 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 536.026 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 3109.53 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 6 + - 3308.31 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 5 + - 1632.02 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 3 + - 3452.57 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3642.52 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 2 + - 676.958 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 0 + - 3733.15 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 7 + - 42.4366 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 2 + - 1259.44 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 0 + - 3578.36 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 7 + - 22.8941 + - - - 2368 + - 
4288 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 0 + - 3558.79 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3002.15 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 2917.45 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 8 + - 76.6595 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 2 + - 716.596 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 2 + - 434.321 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 23.5363 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 3 + - 3388.29 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 4134.75 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 4 + - 3280.21 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 6 + - 2935.68 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 7 + - 66.36 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 1157.14 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 7 + - 6.74141 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 1 + - 2026.28 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 1 + - 2568.07 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 4 + - 3872.69 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 126.041 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 4074.29 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3320.38 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 0 + - 3955.26 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 2444.39 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + 
- 256 + - 256 + - - 6 + - 2966.8 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 860.967 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4177.86 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 6 + - 2883.97 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 5 + - 2109.4 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 1 + - 2356.82 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 7 + - 158.154 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 5 + - 3018.65 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 2 + - 345.417 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 2 + - 1022.14 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 880.153 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 2 + - 1605.97 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 0 + - 3659.17 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 7 + - 13.429 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 5 + - 2351.72 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 3985.1 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 5 + - 1868.76 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 3240.85 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4121.05 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 4 + - 3714.4 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 64.5789 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 2793.34 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 4 + - 3457.72 + - - - 
2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 0 + - 3307.29 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 2 + - 854.784 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 3 + - 3676.24 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 2059.89 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 5 + - 2163.63 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 6 + - 3219.27 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 5 + - 2405.82 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 0 + - 3520.4 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 2 + - 679.353 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 0 + - 3815.12 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 0 + - 4022.07 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 108.933 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 1 + - 1140.96 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 7 + - 4.88687 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 3 + - 3431.58 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3291.2 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 6 + - 3216.38 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 4 + - 3500.9 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 0 + - 3963.31 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 1937.87 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 2 + - 884.522 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 1 + - 2568.63 + - - - 3584 + - 1856 
+ - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 0 + - 3523.17 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 4 + - 3557.97 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 4 + - 3019.04 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 6.25454 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 5 + - 2023.96 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 2081.99 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 53.8336 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 1459.06 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4235.25 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 5 + - 1552.34 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 1754.44 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 3832.67 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 5 + - 2774.48 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 2506.29 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3983.94 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 6 + - 2049.01 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 12.4363 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 0 + - 4035.24 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 8 + - 112.578 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 0 + - 3777.6 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 2 + - 615.139 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 5 + - 1469.36 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - 
- 3 + - 4162.26 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 4 + - 3807.08 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 150.802 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3953.73 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 2656.61 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 7 + - 43.1504 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 0 + - 3456.13 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 1330.25 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 4 + - 3533.04 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 0 + - 3989.01 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 4 + - 3759.93 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 0 + - 3955.47 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 3260.15 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 5 + - 2931.91 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 3314.05 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 6 + - 1663.64 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 0 + - 3366.61 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 0 + - 3901.83 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 3825.48 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 2 + - 300.222 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 0 + - 3463.15 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 4 + - 3917.56 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 0 + - 2894.32 + - - - 2944 + - 
448 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 5 + - 2950.38 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 72.7336 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 4171.16 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 2471.0 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 0 + - 3945.03 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 0 + - 3515.58 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 4 + - 3370.12 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 3 + - 3434.27 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3858.55 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 2561.33 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 5 + - 2379.07 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 5 + - 2854.89 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 7 + - 93.9893 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 0 + - 3518.31 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 7 + - 60.5684 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 3884.63 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 4324.6 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 7 + - 31.2047 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 1674.28 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 2 + - 1016.78 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 1599.11 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 0 + - 3444.48 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + 
- 3584 + - 3328 + - 3328 + - - 3 + - 4132.45 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 2 + - 1257.43 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 3 + - 3214.23 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 56.7984 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 3077.58 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 6 + - 2772.91 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 5 + - 2591.06 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 2 + - 536.558 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 4 + - 3915.26 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 3.41876 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3252.95 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 3888.51 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 4 + - 3946.23 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 5 + - 2524.57 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 7 + - 2.48897 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 4 + - 3734.78 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 1 + - 3040.71 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 3 + - 4119.12 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 3 + - 4012.64 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 4151.1 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 753.022 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 4025.26 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 710.826 + - 
- - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 3292.4 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 1494.64 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 2649.35 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 0 + - 3389.44 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4259.43 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 1960.4 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 108.675 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 2 + - 1154.88 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 5 + - 1281.64 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 6 + - 2264.13 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 4108.75 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 0 + - 3627.7 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3763.17 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 7 + - 72.78 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 3114.58 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 3923.11 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 2880.72 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 6 + - 2684.96 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 1108.79 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 3 + - 3036.86 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 3979.84 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 5 + - 2082.23 + - - - 2368 + - 704 + - 1 + - 768 
+ - 2368 + - 2368 + - 768 + - 768 + - - 0 + - 3280.2 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 6.60929 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 4024.75 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 3940.16 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3272.78 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 4026.52 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 1015.51 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 5 + - 3003.32 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 5 + - 2609.94 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3803.62 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 3 + - 3782.58 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 2308.14 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 2907.82 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4216.97 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4040.01 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 4 + - 3322.98 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3207.4 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 7 + - 99.1004 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 0.205247 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 3 + - 3970.49 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 7 + - 76.7561 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 1382.88 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 
1792 + - 1792 + - - 0 + - 3785.46 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 2 + - 593.586 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 7 + - 82.4428 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 4014.26 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 0.147297 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 4 + - 3732.83 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 1 + - 1710.7 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 3 + - 3960.69 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3955.15 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 2241.05 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 6 + - 3275.56 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 9.95386 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 2 + - 717.905 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 5 + - 1217.5 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 4 + - 3939.37 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 5 + - 2765.1 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 3160.15 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 3 + - 4037.76 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 2933.2 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 5 + - 1211.49 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 21.8833 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 6 + - 2966.72 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 2912.42 + - - - 1856 + - 448 
+ - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 6 + - 2914.8 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 5 + - 1995.58 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 108.24 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 5 + - 2322.55 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 217.221 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 5 + - 1619.33 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 4 + - 3894.97 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 0 + - 3867.84 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 3 + - 4084.35 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 1488.61 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 2116.81 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3882.16 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 2980.45 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 7 + - 138.205 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 7 + - 6.1811 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 0 + - 3256.35 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 2 + - 500.457 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 5 + - 2214.22 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 140.466 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 4 + - 3451.74 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 3180.68 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 2723.57 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + 
- - 4 + - 3434.31 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 3 + - 3961.62 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 1 + - 1516.34 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 2204.84 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 31.6601 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 7 + - 103.546 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 4 + - 3802.0 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 4 + - 3844.41 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 2508.24 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 4091.78 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 1 + - 1108.79 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 1 + - 2097.85 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 0 + - 3608.38 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3494.14 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 7 + - 65.54 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 0 + - 3767.59 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 5 + - 1153.71 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 0 + - 3941.89 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 4 + - 3756.48 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 3 + - 3591.21 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 2444.08 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 3 + - 3223.06 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 0 + - 3734.12 + - - - 3584 + - 4288 + - 1 
+ - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 3 + - 4139.0 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 8 + - 86.4303 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 2 + - 1945.87 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 3 + - 3928.89 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 3 + - 3418.02 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 16.6311 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 4170.31 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 6 + - 3048.08 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 4 + - 3134.49 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 2069.02 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 5 + - 952.035 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 1 + - 1578.36 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 0 + - 3645.8 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 5 + - 1495.33 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 1 + - 1764.85 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 3 + - 3366.48 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 8 + - 80.1206 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 2055.88 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 0 + - 3834.83 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 4 + - 4011.32 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 149.863 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 0 + - 3404.19 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 
+ - - 3 + - 4109.44 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 6 + - 2498.26 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 6.70746 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 69.7989 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 3 + - 4248.83 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 2 + - 1674.96 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 6 + - 2646.07 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 4150.71 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 3 + - 3731.23 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 3 + - 3713.5 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 4 + - 3691.7 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 2 + - 1532.18 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 162.997 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 4 + - 3803.42 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 4025.75 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 1 + - 2439.4 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 8 + - 114.954 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4252.25 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3862.28 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 3102.19 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 3214.28 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4055.76 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 3804.86 + - - - 1024 + 
- 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 3 + - 3857.54 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 3 + - 3810.17 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 4 + - 3294.59 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 3 + - 4213.43 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 3 + - 4151.42 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 104.221 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 2 + - 782.339 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 1 + - 2243.95 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 4 + - 3843.13 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 3896.45 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 34.9587 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 0 + - 3504.68 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 3 + - 4358.78 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 1295.8 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 3 + - 3553.18 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 3 + - 3844.99 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 3 + - 3526.8 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 7 + - 22.457 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 2623.53 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 7 + - 3.08332 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4016.52 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 112.535 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 
768 + - 768 + - - 0 + - 3777.84 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 5 + - 1905.07 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3698.4 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 43.2817 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 5 + - 2132.15 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 0 + - 3322.72 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 3 + - 3990.69 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 6 + - 3470.39 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 4 + - 3336.99 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 262.494 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 4 + - 3524.82 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 7 + - 20.8929 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 0 + - 3273.35 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 2290.86 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 4026.55 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 853.492 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 564.864 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 4 + - 3504.03 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 1937.26 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 3 + - 4169.33 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 6 + - 2191.68 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3757.99 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 6 + - 2608.83 + - - - 
1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 6 + - 3197.71 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 1722.02 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 7 + - 125.372 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3619.11 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 7 + - 114.523 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 3 + - 4077.13 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 0 + - 3385.18 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 5 + - 1869.17 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 4 + - 3291.09 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 5 + - 1756.0 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 3812.85 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 2214.76 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 6 + - 2976.54 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 5 + - 2481.64 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 6 + - 3343.25 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 6 + - 2830.61 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 5 + - 1100.29 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 7 + - 65.1619 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 0 + - 3104.21 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 2018.85 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 2060.07 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 1560.44 + - - - 2944 + - 3584 + - 1 + - 768 + - 
2944 + - 2944 + - 768 + - 768 + - - 3 + - 3902.03 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3309.7 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 558.545 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 0 + - 3829.35 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 0 + - 3777.6 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 1 + - 3223.43 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 2858.71 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 133.193 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 3 + - 4031.67 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 2 + - 891.821 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 6 + - 2437.19 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 3.13365 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 6 + - 2900.65 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 1406.75 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 4 + - 3738.0 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 3304.99 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 215.765 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 4 + - 3898.43 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 2 + - 768.813 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 3 + - 3892.4 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 66.1967 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 1 + - 2563.12 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 3 + - 3963.2 + - - - 2368 
+ - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 4 + - 3863.82 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 1606.41 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 23.0616 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 5 + - 2049.52 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 7 + - 127.111 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3502.73 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 5 + - 2732.77 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 5 + - 3000.67 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4122.05 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 5 + - 1994.21 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 3 + - 3866.88 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 1665.22 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 3366.98 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 4 + - 3597.57 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 6 + - 2658.23 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 1067.89 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 2512.74 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 1943.57 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 3 + - 3528.29 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 0 + - 3564.84 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 7 + - 21.8379 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 7 + - 158.333 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 
256 + - 256 + - - 1 + - 1924.3 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 3 + - 4351.33 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 1 + - 2424.08 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 7 + - 138.197 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 0 + - 3343.06 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 2 + - 299.593 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 2646.56 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 3131.85 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 7 + - 206.195 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 6 + - 2613.54 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 3 + - 4401.65 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 3733.95 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 3287.15 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 0 + - 3815.37 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 4 + - 3909.32 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 3 + - 3793.79 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 0 + - 3543.9 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 0 + - 3980.55 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 1 + - 2512.58 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 3052.26 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 6 + - 2708.82 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 2908.72 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 
+ - 1737.12 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 2 + - 766.876 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 4 + - 3299.07 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 4032.77 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4067.76 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 6 + - 3466.62 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 2170.99 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 1386.94 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 4 + - 3608.02 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 0 + - 3606.13 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 5 + - 1467.93 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 3 + - 4059.27 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 1 + - 2296.74 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 4 + - 3785.39 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 0 + - 3701.49 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 3977.24 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 2379.08 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4102.61 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 2341.32 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 5 + - 2450.42 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 0 + - 3443.87 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 8 + - 66.1168 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 2727.52 + - - - 
5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 3 + - 4370.81 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 4 + - 3797.12 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 378.866 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 2701.07 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 6 + - 3351.04 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 2 + - 449.32 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 3 + - 4395.29 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 3 + - 3937.21 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 13.4054 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 5 + - 1791.16 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 8 + - 65.9035 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 6 + - 3172.76 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 2684.04 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 0 + - 3900.43 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 2857.86 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 4 + - 3631.34 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 1687.36 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 4 + - 3783.43 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 2 + - 713.288 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 2 + - 225.314 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 6 + - 3141.68 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 3001.0 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + 
- 4288 + - 3328 + - 3328 + - - 0 + - 3973.4 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 2 + - 74.3601 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3431.86 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 101.132 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 3 + - 3963.75 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 6 + - 3357.32 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 5 + - 2515.24 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 4 + - 3871.99 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 3737.94 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 5 + - 1729.74 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 3 + - 4300.2 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 3 + - 3844.76 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 7 + - 29.848 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 3325.97 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 0 + - 3760.19 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 4 + - 3198.2 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 5 + - 1146.84 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 13.1003 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 5 + - 2202.94 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 4 + - 3004.89 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 0 + - 3112.16 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 31.887 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 0 + - 3788.3 + - - - 
5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 7 + - 182.016 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 0 + - 3758.34 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 4 + - 3605.79 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 2197.54 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 392.337 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 0 + - 3137.03 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 84.8213 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3877.88 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 2484.13 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 5 + - 2510.52 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 3 + - 4100.18 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 5 + - 1807.42 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 3005.78 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 32.6355 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 6 + - 3173.73 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 2437.49 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 2934.74 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 1967.37 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 0 + - 3635.13 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 5 + - 2403.67 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 2 + - 890.209 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 6 + - 2648.92 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 
1024 + - 256 + - 256 + - - 6 + - 2139.22 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 3 + - 3735.88 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3943.16 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 6 + - 2871.9 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 5 + - 1837.92 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 4 + - 3908.47 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 2 + - 1212.11 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 5.09562 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 3 + - 3905.33 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 5 + - 1175.61 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 2 + - 395.457 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 6 + - 3153.54 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 5 + - 2408.47 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 4 + - 2887.5 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3775.55 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 3 + - 3838.62 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 1152.56 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 5 + - 1333.26 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 2 + - 1584.84 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3515.84 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 3800.37 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 1946.66 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 6 
+ - 2884.28 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 6 + - 2503.69 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 4 + - 3457.54 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 1549.72 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 2738.42 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 0 + - 3913.15 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 1758.9 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 1140.69 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 7 + - 16.0478 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 6 + - 1920.85 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 149.696 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 2750.63 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 1481.63 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 6 + - 1495.86 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 5 + - 2324.93 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 0 + - 4021.58 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 55.7085 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 6 + - 2659.91 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 2 + - 401.315 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 5 + - 2900.11 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 2605.0 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 7 + - 32.5243 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4132.5 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 1792 
+ - 1792 + - - 7 + - 34.1077 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 4 + - 3840.55 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 2926.91 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 90.5271 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 6 + - 3455.76 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 4 + - 3949.71 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 2 + - 1156.91 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3137.52 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 2 + - 198.828 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 4 + - 3739.9 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4019.39 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 0 + - 3725.79 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 4 + - 3824.97 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 434.27 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 5 + - 1989.69 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 1698.88 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 3 + - 3780.08 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 4 + - 3444.79 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 7 + - 90.2377 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 223.971 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 3015.48 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 3 + - 3835.43 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 0 + - 2890.97 + - - - 6784 
+ - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 3940.37 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 6 + - 3004.32 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3877.45 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 0 + - 4027.68 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 6 + - 3226.99 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 3 + - 4362.06 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 1297.0 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 2 + - 153.36 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 0 + - 3910.82 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 1 + - 1888.46 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 5 + - 2150.46 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 6 + - 3355.82 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4149.16 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 6 + - 2999.52 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 7 + - 9.73118 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 2744.47 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 4 + - 3498.06 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 2269.99 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 2 + - 396.054 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 7 + - 109.453 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 4034.28 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 7 + - 67.9596 + - - - 1408 + - 1408 + - 1 + - 1792 + - 
1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 2895.62 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 5 + - 1551.01 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 1498.35 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 2914.21 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 2 + - 109.235 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 3 + - 4358.17 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 3119.82 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 5 + - 1657.55 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 3 + - 3256.66 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 3112.91 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 7 + - 33.9483 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 2 + - 112.704 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 66.5315 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 5 + - 3052.22 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 76.2308 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 1 + - 2663.87 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 1 + - 2933.66 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 6 + - 3280.2 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 4052.64 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 2 + - 852.963 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 4082.68 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 0 + - 3564.95 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 2 + - 
855.481 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 4008.36 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 0 + - 3838.1 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 3 + - 4247.41 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 4 + - 3273.85 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 4387.22 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 3802.95 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 4 + - 3517.16 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 4 + - 3263.1 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 5 + - 2467.98 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3331.87 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 4129.55 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 6 + - 2519.79 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 3041.59 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 4 + - 3148.94 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 3 + - 4001.27 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 5 + - 2888.31 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 65.2708 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 0 + - 3844.53 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 7 + - 176.16 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 5 + - 1420.67 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 2731.74 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 2697.6 + - - - 5056 + 
- 4 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 7 + - 139.557 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 4 + - 2932.99 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 5 + - 2671.15 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 3 + - 3951.69 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 7 + - 62.5511 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 6 + - 2730.59 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 3 + - 4053.56 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 1 + - 2149.69 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 0 + - 3943.73 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 1 + - 855.631 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 3 + - 3804.87 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 5 + - 1552.23 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 0 + - 3382.74 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 4 + - 3561.34 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 1 + - 2677.42 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 5 + - 2569.11 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 4 + - 3851.13 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 0 + - 3288.72 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 3 + - 3359.9 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 7 + - 6.58145 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 4 + - 3759.49 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 1792.92 + - - - 2944 + - 1408 + - 1 + - 256 + - 
2944 + - 2944 + - 256 + - 256 + - - 6 + - 3177.83 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3495.41 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 2071.18 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 5 + - 3013.89 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 0 + - 3872.27 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 6 + - 2979.62 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 3060.39 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 4 + - 3908.24 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 3381.96 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 5 + - 2025.58 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 0 + - 3276.42 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 5 + - 1673.68 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 8 + - 71.5333 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 7 + - 0.211818 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 2 + - 217.986 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 5 + - 2125.93 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 2 + - 1299.37 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 1791.09 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 1 + - 1112.35 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3826.11 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 5 + - 2129.68 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 7 + - 127.058 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 
+ - - 0 + - 4074.23 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 1 + - 2861.38 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 6 + - 2959.27 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 3 + - 3439.95 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 0 + - 4036.06 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 3181.9 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 3 + - 3934.24 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 176.292 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 99.6577 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 6 + - 2933.5 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 0 + - 3460.7 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 1 + - 2362.88 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 5 + - 1911.27 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 2309.77 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 0 + - 3903.22 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 4 + - 3096.87 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 3 + - 4219.73 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 4 + - 3949.36 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 3 + - 4109.02 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 5 + - 1217.42 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 2 + - 1549.53 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 0 + - 3598.13 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 0 + - 3937.09 + - - - 
4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 3 + - 3930.61 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 1 + - 1100.29 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 6 + - 3043.2 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 7 + - 163.696 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 2 + - 753.11 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 1 + - 965.94 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 3 + - 3980.24 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 764.826 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 3 + - 3975.0 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 4363.13 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 2 + - 1020.46 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 3 + - 4126.19 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 2380.28 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 0 + - 3938.53 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 2 + - 1584.13 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 592.656 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 2 + - 781.963 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 128.374 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 2901.92 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 3 + - 4134.91 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 4 + - 3872.77 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3197.89 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 256 
+ - 256 + - - 3 + - 3556.2 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 4 + - 3281.84 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 3 + - 3930.75 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 7 + - 12.2279 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 3 + - 4336.2 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 6 + - 3474.12 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 2483.9 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 3819.24 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 3 + - 4022.48 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 108.675 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 2 + - 342.75 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 3 + - 4161.07 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 0 + - 3572.4 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 6 + - 3278.06 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 7 + - 21.307 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 2 + - 1532.18 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 3 + - 3314.65 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 2 + - 1868.42 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 0 + - 4019.86 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 0 + - 3758.65 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 6 + - 3130.46 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 1 + - 1112.35 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 7 + - 81.9581 + - - - 6784 + - 704 + - 1 
+ - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 0 + - 3796.02 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 3 + - 4291.75 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 5 + - 3058.7 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 4 + - 3492.85 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 0 + - 3764.21 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 2 + - 392.81 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 5 + - 2778.18 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 0 + - 3783.16 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 4 + - 2995.2 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 0 + - 3806.19 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 6 + - 2205.16 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 3 + - 3991.52 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 3 + - 4131.3 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 2 + - 1498.85 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 1943.97 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 1 + - 2351.63 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 0 + - 4044.93 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 3 + - 3228.83 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 6 + - 3272.83 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 2539.14 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 2 + - 1252.53 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 4 + - 3504.5 + - - - 256 + - 448 + - 1 + - 
1792 + - 256 + - 256 + - 1792 + - 1792 + - - 2 + - 1451.8 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 0 + - 3374.04 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 7 + - 45.5761 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 1111.09 +- null diff --git a/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml new file mode 100644 index 000000000..156d94ddf --- /dev/null +++ b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml @@ -0,0 +1,19425 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + 
BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 128 + LSCB: 64 + LSPA: 2 + LSPB: 4 + LVCA: 128 + LVCB: 64 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 1536 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + 
PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + 
BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 64 + LSCB: 64 + LSPA: 4 + LSPB: 4 + LVCA: 64 + LVCB: 64 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 1024 + LdsOffsetA: 0 + LdsOffsetB: 512 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + 
PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x8_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + 
CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 64 + LSPA: 8 + LSPB: 4 + LVCA: 8 + LVCB: 16 + LVPA: 2 + LVPB: 1 + LdcEqualsLdd: true + LdsNumElements: 1792 + LdsNumElementsAlignedA: 256 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 256 + LdsOffsetB_Blk: 1280 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + 
PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x64x8_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + 
BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 32 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 32 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 4 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 4 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + 
PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x32x32_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: 
true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: 
-1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + 
AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 64 + LSPA: 8 + LSPB: 4 + LVCA: 32 + LVCB: 64 + LVPA: 8 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 4 + NumLoadsB: 8 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 8 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 
+ PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x64x32_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + 
AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 4 + LSPB: 8 + LVCA: 64 + LVCB: 32 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 8 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 8 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + 
PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x32x32_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + 
AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 8 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 
256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x64x32_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 
1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 64 + LSPA: 2 + LSPB: 4 + LVCA: 128 + LVCB: 64 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + 
NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 8 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 
+ WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 4 + LSPB: 4 + LVCA: 64 + LVCB: 64 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + 
NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 9 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + 
VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 128 + LSPA: 16 + LSPB: 8 + LVCA: 16 + LVCB: 32 + LVPA: 4 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + 
NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 10 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x128x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: 
true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 128 + LSPA: 4 + LSPB: 2 + LVCA: 64 + LVCB: 128 + LVPA: 4 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 
32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 11 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + 
UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 
+ NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 12 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU8_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + 
VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 128 + LSPA: 4 + LSPB: 2 + LVCA: 64 + LVCB: 128 + LVPA: 4 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + 
NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 13 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU2_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + 
ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + 
NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 14 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + 
UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 8 + LSPB: 8 + LVCA: 32 + LVCB: 32 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 256 + LdsNumElementsAlignedB: 256 + LdsOffsetA: 0 + LdsOffsetA_Blk: 512 + LdsOffsetB: 256 + LdsOffsetB_Blk: 768 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + 
MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 15 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x32x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + 
ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 4 + LSPB: 8 + LVCA: 64 + LVCB: 32 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + 
MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 8 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 8 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 16 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x32x32_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 
+ SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 64 + LSPA: 8 + LSPB: 16 + LVCA: 32 + LVCB: 16 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 2048 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + 
MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 17 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + 
ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + 
MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 18 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + 
SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 64 + LSPA: 8 + LSPB: 4 + LVCA: 32 + LVCB: 64 + LVPA: 8 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + 
LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 4 + NumLoadsB: 8 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 8 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 19 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x64x32_SE_AMAS0_GRVW1_GSU4_VW1 + 
StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 128 + LSPA: 8 + LSPB: 8 + LVCA: 32 + LVCB: 32 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + 
LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 20 + 
SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x128x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 64 + LSPA: 2 + LSPB: 4 + LVCA: 128 + LVCB: 64 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + 
LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + 
ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 21 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 64 + LSPA: 2 + LSPB: 4 + LVCA: 128 + LVCB: 64 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 
0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: 
false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 22 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU2_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 128 + LSPA: 4 + LSPB: 2 + LVCA: 64 + LVCB: 128 + LVPA: 4 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + 
LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + 
TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 23 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 2 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 4 + LSPB: 4 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + 
LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: 
false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 24 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT16x16x4_SE_AMAS2_GRVW2_GSU1_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 4 + LSPB: 4 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 409 
+ LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + 
TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 25 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT16x16x4_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true 
+ LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 
+ Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 26 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + 
LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + 
TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 27 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU4_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + 
LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false 
+ TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 28 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU8_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 
8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + 
SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 29 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU2_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + 
LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + 
SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 30 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + 
KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: 
GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 31 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 5056 + - - 7 + - 3113.52 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1408 + - - 18 + - 3973.05 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 2944 + - - 4 + - 3266.22 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 256 + - - 7 + - 3329.42 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 128 + - 64 + - - 15 + - 53.3898 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 704 + - - 20 + - 4018.68 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1856 + - - 10 + - 4102.71 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 448 + - 6784 + - - 7 + - 3621.28 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 448 + - - 4 + - 3861.05 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1024 + - - 20 + - 2908.32 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 128 + - - 18 + - 3238.61 + - - - 
2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1024 + - - 20 + - 3388.28 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 256 + - - 18 + - 3394.98 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 448 + - - 7 + - 3183.0 + - - - 4 + - 448 + - 1 + - 128 + - 4 + - 4 + - 4 + - 448 + - - 25 + - 4.11367 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 4288 + - - 9 + - 3031.84 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 128 + - - 7 + - 1951.19 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 6784 + - - 10 + - 4231.82 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1408 + - - 19 + - 1456.36 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 4 + - 6784 + - - 26 + - 205.608 + - - - 4288 + - 4 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 4 + - - 25 + - 38.9822 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 5056 + - - 17 + - 4222.14 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 704 + - 1408 + - - 7 + - 2826.2 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 4288 + - - 17 + - 4371.52 + - - - 2368 + - 6784 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 6784 + - - 0 + - 2500.56 + - - - 1024 + - 5888 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 5888 + - - 1 + - 2114.62 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 6784 + - - 18 + - 3082.34 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 448 + - - 18 + - 3636.87 + - - - 5056 + - 128 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 3 + - 876.031 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 128 + - - 7 + - 2456.41 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1408 + - - 27 + - 24.756 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1856 + - - 15 + - 1281.99 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 4288 + - - 17 + - 4139.4 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 
+ - 5888 + - 5888 + - 1856 + - - 18 + - 3944.73 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 64 + - 64 + - - 14 + - 42.2813 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 4 + - - 28 + - 0.483019 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 6784 + - - 10 + - 4138.18 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1024 + - - 4 + - 3184.4 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 256 + - - 4 + - 3449.9 + - - - 3584 + - 2944 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 2944 + - - 0 + - 2406.23 + - - - 5888 + - 448 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 448 + - - 0 + - 1716.36 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 1024 + - - 8 + - 3623.83 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1856 + - - 18 + - 4018.68 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 1856 + - - 18 + - 3399.06 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 704 + - - 4 + - 2698.09 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 2944 + - - 20 + - 4214.12 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1856 + - - 4 + - 3998.14 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 4 + - - 30 + - 258.72 + - - - 2944 + - 3584 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 3584 + - - 0 + - 2416.56 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 6784 + - - 17 + - 4430.11 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 4 + - 1024 + - - 28 + - 47.7784 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1856 + - - 18 + - 3703.11 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 5888 + - - 27 + - 371.686 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 5056 + - - 18 + - 3887.2 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 3584 + - - 10 + - 4042.43 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 128 + - 
- 14 + - 1500.06 + - - - 1856 + - 1408 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 1408 + - - 0 + - 1681.22 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 128 + - - 7 + - 1747.63 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 1408 + - - 18 + - 3771.23 + - - - 1408 + - 5888 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 5888 + - - 1 + - 2287.38 + - - - 448 + - 4 + - 1 + - 128 + - 448 + - 448 + - 448 + - 4 + - - 25 + - 4.26037 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 2368 + - - 10 + - 3980.93 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 64 + - - 7 + - 830.207 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1856 + - - 10 + - 4012.71 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 1408 + - - 18 + - 4020.65 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 3584 + - - 7 + - 2445.51 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 704 + - - 6 + - 1106.03 + - - - 1024 + - 1024 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 1024 + - - 1 + - 974.287 + - - - 1856 + - 2368 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 2368 + - - 1 + - 2019.54 + - - - 3584 + - 256 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 256 + - - 1 + - 1053.85 + - - - 4288 + - 1024 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 1024 + - - 0 + - 1930.07 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 4 + - 2944 + - - 27 + - 49.1948 + - - - 704 + - 128 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 3 + - 151.768 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 2368 + - - 7 + - 4174.92 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 128 + - - 12 + - 150.657 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 6784 + - - 10 + - 4287.21 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 704 + - 4 + - - 28 + - 13.8421 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 4288 + - - 10 + - 4137.71 + - - - 448 
+ - 64 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 64 + - - 5 + - 452.291 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 2944 + - - 10 + - 3994.34 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 128 + - - 7 + - 2155.41 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 64 + - - 19 + - 1099.31 + - - - 1408 + - 5056 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 5056 + - - 0 + - 2168.32 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 128 + - - 18 + - 3018.97 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 704 + - 704 + - - 7 + - 2156.81 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1856 + - - 18 + - 3856.87 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 3584 + - - 10 + - 4040.35 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1408 + - - 4 + - 4006.97 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1024 + - - 15 + - 395.689 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 2368 + - - 18 + - 4161.31 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 5056 + - - 17 + - 4266.99 + - - - 704 + - 6784 + - 1 + - 128 + - 704 + - 704 + - 704 + - 6784 + - - 1 + - 2037.74 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 448 + - 704 + - - 4 + - 2232.86 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 4 + - 704 + - - 27 + - 13.3499 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 128 + - 704 + - - 7 + - 837.44 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 704 + - - 7 + - 3796.58 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 5056 + - - 18 + - 4068.92 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 2368 + - - 28 + - 260.606 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1408 + - - 18 + - 4171.04 + - - - 448 + - 64 + - 1 + - 128 + - 448 + - 448 + - 448 + - 64 + - - 3 + - 52.6696 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 
256 + - 256 + - 1408 + - - 15 + - 1763.66 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1024 + - - 17 + - 3621.89 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 4288 + - - 4 + - 3864.67 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 2944 + - - 10 + - 4263.67 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 2368 + - - 18 + - 3987.55 + - - - 1856 + - 128 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 388.262 + - - - 5056 + - 256 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 256 + - - 1 + - 1234.91 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1024 + - - 17 + - 2945.89 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 448 + - - 14 + - 433.369 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 2368 + - - 18 + - 3930.78 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3584 + - - 10 + - 4287.53 + - - - 4288 + - 6784 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 6784 + - - 0 + - 2601.23 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 2368 + - - 18 + - 4111.79 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 128 + - 448 + - - 15 + - 350.192 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 448 + - 2944 + - - 18 + - 3447.2 + - - - 2368 + - 4 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 4 + - - 25 + - 21.5581 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 448 + - - 4 + - 4069.89 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1408 + - - 4 + - 3078.35 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 704 + - 6784 + - - 18 + - 3982.71 + - - - 1024 + - 5056 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 5056 + - - 1 + - 2030.33 + - - - 1856 + - 64 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 64 + - - 3 + - 200.479 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1024 + - - 20 + - 3451.09 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 
+ - 2368 + - 1856 + - - 18 + - 4149.44 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 64 + - - 12 + - 134.063 + - - - 5888 + - 1856 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 1856 + - - 0 + - 2361.25 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 448 + - - 18 + - 3078.42 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 18 + - 2262.41 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 256 + - - 7 + - 2132.18 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1024 + - - 7 + - 754.371 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 5056 + - - 18 + - 4018.19 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 448 + - 448 + - - 15 + - 1105.43 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 6784 + - - 10 + - 4265.75 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 4288 + - - 10 + - 4189.99 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 5888 + - - 10 + - 4192.46 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 128 + - - 7 + - 2204.21 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 64 + - - 15 + - 531.047 + - - - 128 + - 4 + - 1 + - 128 + - 128 + - 128 + - 128 + - 4 + - - 25 + - 1.2282 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 5056 + - - 17 + - 4425.06 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 1856 + - - 17 + - 3892.55 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 6784 + - - 4 + - 3886.67 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 128 + - - 7 + - 3056.13 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 4 + - - 28 + - 99.8689 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1408 + - - 18 + - 3710.78 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 5056 + - - 17 + - 4186.7 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 
5056 + - - 18 + - 4089.12 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 128 + - 2368 + - - 15 + - 1556.87 + - - - 2944 + - 448 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 448 + - - 1 + - 1261.36 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 5888 + - - 10 + - 4314.13 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 7 + - 1769.07 + - - - 256 + - 64 + - 1 + - 128 + - 256 + - 256 + - 256 + - 64 + - - 3 + - 27.2783 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 64 + - - 19 + - 1937.05 + - - - 6784 + - 128 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 3 + - 1110.6 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 4288 + - - 18 + - 4007.98 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 256 + - - 4 + - 3635.96 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 128 + - - 16 + - 273.678 + - - - 4288 + - 4288 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 4288 + - - 0 + - 2574.53 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 4 + - - 26 + - 203.68 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 4 + - - 28 + - 40.6862 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 4288 + - - 18 + - 4160.53 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 128 + - - 28 + - 14.4991 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 704 + - - 7 + - 2823.69 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 256 + - 2368 + - - 4 + - 2615.55 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1408 + - - 28 + - 178.849 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 704 + - - 7 + - 3949.11 + - - - 6784 + - 2944 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 2944 + - - 0 + - 2573.52 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 448 + - - 7 + - 2006.47 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 256 + - - 7 + - 2239.72 + - - - 704 + - 
1024 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1024 + - - 11 + - 3348.51 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1856 + - - 18 + - 4050.74 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1024 + - - 20 + - 3787.02 + - - - 64 + - 4288 + - 1 + - 128 + - 64 + - 64 + - 64 + - 4288 + - - 3 + - 411.519 + - - - 1408 + - 2368 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 2368 + - - 1 + - 1845.25 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 2944 + - - 4 + - 3625.7 + - - - 4 + - 1408 + - 1 + - 128 + - 4 + - 4 + - 4 + - 1408 + - - 25 + - 12.3105 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 64 + - - 4 + - 1628.97 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 2944 + - - 4 + - 3049.51 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 4 + - - 28 + - 7.88776 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1856 + - - 7 + - 3124.18 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1856 + - - 27 + - 32.4546 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 6784 + - - 10 + - 4259.01 + - - - 2368 + - 5888 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 5888 + - - 0 + - 2439.42 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 256 + - - 5 + - 415.341 + - - - 2368 + - 1856 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 1856 + - - 1 + - 2018.96 + - - - 2944 + - 4 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 4 + - - 25 + - 26.9168 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 4 + - - 30 + - 32.5882 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 704 + - 2368 + - - 18 + - 3002.04 + - - - 1856 + - 448 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 448 + - - 3 + - 1056.7 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 5888 + - - 17 + - 4367.53 + - - - 3584 + - 5056 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 5056 + - - 0 + - 2540.59 + - - - 5888 + - 2944 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 
2944 + - - 0 + - 2558.8 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 704 + - - 20 + - 3946.11 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 256 + - - 4 + - 3182.39 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 2944 + - - 10 + - 4208.2 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3584 + - - 17 + - 4228.98 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 704 + - - 9 + - 2122.08 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1856 + - - 19 + - 1870.33 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 2944 + - - 18 + - 3985.41 + - - - 1408 + - 704 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 704 + - - 1 + - 1005.05 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 5056 + - - 4 + - 2745.48 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1856 + - - 7 + - 3908.07 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 4288 + - - 17 + - 4242.43 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1024 + - - 28 + - 92.6772 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 3584 + - - 20 + - 4352.28 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1408 + - - 18 + - 3835.15 + - - - 3584 + - 4 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 4 + - - 25 + - 32.7683 + - - - 2944 + - 5056 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 5056 + - - 0 + - 2467.45 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 2944 + - - 4 + - 3754.61 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 3584 + - - 10 + - 4248.22 + - - - 1856 + - 4288 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 4288 + - - 1 + - 2232.8 + - - - 1408 + - 1856 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 1856 + - - 0 + - 1688.69 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 64 + - 448 + - - 15 + - 182.044 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1856 + - - 10 + 
- 4055.91 + - - - 3584 + - 1408 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 1408 + - - 1 + - 2027.13 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 448 + - - 18 + - 3424.67 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 4 + - - 30 + - 190.48 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 6784 + - - 4 + - 3595.4 + - - - 448 + - 5056 + - 1 + - 128 + - 448 + - 448 + - 448 + - 5056 + - - 1 + - 1580.52 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 704 + - 1024 + - - 18 + - 2757.21 + - - - 1408 + - 4 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 4 + - - 25 + - 12.9846 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 256 + - 5056 + - - 18 + - 3390.35 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 5888 + - - 4 + - 3251.99 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 128 + - 5888 + - - 18 + - 2270.93 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 4 + - - 30 + - 59.1175 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 64 + - - 7 + - 1368.67 + - - - 5888 + - 1408 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 1408 + - - 1 + - 2299.27 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 2944 + - - 4 + - 3143.19 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 5888 + - - 17 + - 4258.38 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 256 + - - 4 + - 3139.1 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 128 + - 5888 + - - 4 + - 2825.14 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 256 + - - 19 + - 1845.66 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 2944 + - - 10 + - 3973.47 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 4288 + - - 7 + - 2232.13 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 6784 + - - 18 + - 4048.94 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 5888 + - - 18 + - 3939.39 + - - - 448 + - 256 + - 1 
+ - 256 + - 448 + - 448 + - 448 + - 256 + - - 7 + - 662.458 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 256 + - 4 + - - 28 + - 15.4809 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 3584 + - - 10 + - 4100.08 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 64 + - - 7 + - 1985.58 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 64 + - - 7 + - 1948.63 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 2368 + - - 18 + - 4086.94 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1408 + - - 19 + - 1081.73 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 3584 + - - 17 + - 3387.47 + - - - 448 + - 1408 + - 1 + - 128 + - 448 + - 448 + - 448 + - 1408 + - - 3 + - 856.752 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 4 + - - 26 + - 303.992 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 256 + - - 14 + - 1190.0 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1024 + - - 27 + - 18.3061 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 6784 + - - 10 + - 4419.48 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1024 + - - 7 + - 1435.7 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 2944 + - - 7 + - 3206.43 + - - - 64 + - 448 + - 1 + - 128 + - 64 + - 64 + - 64 + - 448 + - - 3 + - 45.466 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 448 + - - 7 + - 2334.16 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 64 + - 4288 + - - 7 + - 1961.69 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 5888 + - - 17 + - 4323.1 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 256 + - 2944 + - - 4 + - 2827.34 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 2368 + - - 7 + - 4048.01 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1024 + - - 14 + - 1117.34 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 2368 + - - 18 + - 
3876.41 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 448 + - - 18 + - 3311.23 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 2368 + - - 28 + - 184.339 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 448 + - 4 + - - 31 + - 9.50978 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 704 + - 3584 + - - 4 + - 3359.52 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1408 + - - 9 + - 3238.2 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 256 + - - 5 + - 775.397 + - - - 448 + - 1856 + - 1 + - 128 + - 448 + - 448 + - 448 + - 1856 + - - 3 + - 1035.32 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 256 + - - 4 + - 3796.1 + - - - 704 + - 1856 + - 1 + - 128 + - 704 + - 704 + - 704 + - 1856 + - - 1 + - 1255.61 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 256 + - 128 + - - 7 + - 302.474 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 448 + - - 28 + - 46.1919 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 6784 + - - 4 + - 3748.81 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 2944 + - - 17 + - 4186.12 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 256 + - - 9 + - 2166.85 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 5056 + - - 18 + - 4053.85 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 4 + - 2944 + - - 27 + - 118.501 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 402.109 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 4 + - 3584 + - - 30 + - 59.0414 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3584 + - - 17 + - 4367.01 + - - - 256 + - 1408 + - 1 + - 128 + - 256 + - 256 + - 256 + - 1408 + - - 1 + - 482.205 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 704 + - - 18 + - 3021.1 + - - - 4288 + - 704 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 704 + - - 1 + - 1747.47 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 
6784 + - - 10 + - 4285.98 + - - - 448 + - 4288 + - 1 + - 128 + - 448 + - 448 + - 448 + - 4288 + - - 2 + - 1632.31 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1856 + - - 18 + - 3969.34 + - - - 5056 + - 2368 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 2368 + - - 0 + - 2391.83 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 704 + - - 18 + - 3625.17 + - - - 2368 + - 1024 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 1024 + - - 0 + - 1546.33 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1024 + - - 18 + - 3481.25 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1408 + - - 18 + - 3864.35 + - - - 4288 + - 5888 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 5888 + - - 0 + - 2579.1 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 448 + - - 18 + - 3467.02 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 128 + - - 15 + - 1542.02 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 18 + - 3061.96 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1408 + - - 7 + - 834.209 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 704 + - 4 + - - 28 + - 36.0929 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 256 + - - 7 + - 1871.06 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3584 + - - 7 + - 2616.41 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 704 + - 3584 + - - 10 + - 3110.18 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3584 + - - 4 + - 3970.89 + - - - 6784 + - 3584 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 3584 + - - 0 + - 2645.33 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 4288 + - - 4 + - 3530.93 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 128 + - 5056 + - - 4 + - 2044.36 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 2368 + - - 4 + - 3056.02 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 64 + - - 7 + - 2652.19 + 
- - - 4288 + - 64 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 64 + - - 3 + - 414.237 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 6784 + - - 10 + - 4405.4 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 704 + - 2944 + - - 4 + - 3469.96 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1024 + - - 20 + - 4101.81 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 5888 + - - 18 + - 4137.88 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 4 + - - 27 + - 50.786 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1408 + - - 7 + - 2553.73 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 4 + - 4288 + - - 27 + - 67.1804 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 5888 + - - 18 + - 3948.79 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 448 + - 2368 + - - 18 + - 2507.21 + - - - 3584 + - 5888 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 5888 + - - 0 + - 2592.46 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 4 + - 4 + - - 28 + - 0.265744 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 64 + - - 7 + - 604.367 + - - - 4288 + - 1408 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 1408 + - - 1 + - 2130.57 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1856 + - - 7 + - 1093.31 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1408 + - - 7 + - 2743.78 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 448 + - - 4 + - 3883.56 + - - - 448 + - 256 + - 1 + - 128 + - 448 + - 448 + - 448 + - 256 + - - 3 + - 194.181 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 128 + - - 7 + - 1629.14 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 5056 + - - 18 + - 3988.79 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 256 + - - 28 + - 28.0411 + - - - 6784 + - 5056 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 5056 + - - 0 + - 2709.18 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 
704 + - 3584 + - - 4 + - 3666.3 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1024 + - - 20 + - 3268.29 + - - - 5056 + - 64 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 64 + - - 3 + - 480.719 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 704 + - - 7 + - 3478.45 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 6784 + - - 10 + - 3993.99 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 704 + - 4288 + - - 18 + - 3350.68 + - - - 64 + - 5056 + - 1 + - 128 + - 64 + - 64 + - 64 + - 5056 + - - 3 + - 468.962 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1024 + - - 18 + - 2733.19 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 5056 + - - 10 + - 4249.37 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 704 + - - 7 + - 4025.83 + - - - 2944 + - 64 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 64 + - - 3 + - 317.332 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 704 + - - 9 + - 3259.19 + - - - 4 + - 64 + - 1 + - 128 + - 4 + - 4 + - 4 + - 64 + - - 25 + - 0.548331 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 2944 + - - 10 + - 4243.62 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 1408 + - - 18 + - 3974.97 + - - - 256 + - 5888 + - 1 + - 128 + - 256 + - 256 + - 256 + - 5888 + - - 1 + - 1294.54 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1024 + - - 22 + - 3589.81 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 4 + - - 27 + - 158.022 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1856 + - - 18 + - 3321.05 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 128 + - - 11 + - 2726.97 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 64 + - 64 + - - 7 + - 22.2533 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 256 + - - 4 + - 3759.56 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 6784 + - - 10 + - 
4303.45 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 448 + - 1024 + - - 7 + - 2194.33 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 4288 + - - 17 + - 4360.59 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 128 + - 3584 + - - 7 + - 2168.4 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 4 + - 3584 + - - 27 + - 139.297 + - - - 6784 + - 2368 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 2368 + - - 0 + - 2519.43 + - - - 128 + - 256 + - 1 + - 128 + - 128 + - 128 + - 128 + - 256 + - - 3 + - 56.0137 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 2944 + - - 18 + - 3243.75 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 448 + - - 7 + - 3055.04 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 2368 + - - 10 + - 4208.91 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 3584 + - - 4 + - 3420.14 + - - - 128 + - 2944 + - 1 + - 128 + - 128 + - 128 + - 128 + - 2944 + - - 3 + - 523.833 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 704 + - - 14 + - 1522.61 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1856 + - - 18 + - 3832.47 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3584 + - - 17 + - 4119.44 + - - - 2944 + - 128 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 3 + - 581.419 + - - - 1856 + - 6784 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 6784 + - - 1 + - 2409.21 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 4288 + - - 20 + - 4380.09 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 3584 + - - 10 + - 4080.5 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 448 + - - 7 + - 3829.87 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3584 + - - 20 + - 4390.34 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 5888 + - - 10 + - 4275.07 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 256 + - - 7 + - 
2619.08 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 448 + - - 7 + - 3663.47 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 704 + - - 18 + - 2339.19 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 448 + - - 4 + - 3377.32 + - - - 6784 + - 1024 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 1024 + - - 0 + - 2125.22 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 2368 + - - 18 + - 4016.29 + - - - 1024 + - 1408 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 1408 + - - 1 + - 1375.59 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 4 + - - 29 + - 99.9254 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 817.831 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 4288 + - - 10 + - 4202.31 + - - - 3584 + - 1856 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 1856 + - - 0 + - 2196.26 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 2944 + - - 18 + - 3930.31 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 5888 + - - 17 + - 4306.91 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 128 + - 5056 + - - 4 + - 2797.3 + - - - 5888 + - 1024 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 1024 + - - 0 + - 2050.35 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 6784 + - - 7 + - 3450.0 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 704 + - - 7 + - 3637.63 + - - - 256 + - 2944 + - 1 + - 128 + - 256 + - 256 + - 256 + - 2944 + - - 1 + - 901.917 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3584 + - - 10 + - 4071.21 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 448 + - 128 + - - 15 + - 354.249 + - - - 1856 + - 4 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 4 + - - 25 + - 16.8251 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 6784 + - - 10 + - 4393.61 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 2368 + - - 18 + - 4075.35 
+ - - - 448 + - 704 + - 1 + - 128 + - 448 + - 448 + - 448 + - 704 + - - 3 + - 501.617 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 4288 + - - 17 + - 4322.53 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 2368 + - - 18 + - 3765.74 + - - - 2944 + - 4288 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 4288 + - - 0 + - 2496.38 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 2944 + - - 7 + - 2034.97 + - - - 1856 + - 1024 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 1024 + - - 2 + - 1544.37 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 704 + - - 7 + - 3674.62 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 2944 + - - 20 + - 4252.0 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 704 + - - 4 + - 3858.27 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1856 + - - 17 + - 4287.04 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 5056 + - - 18 + - 3869.6 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1856 + - - 20 + - 3695.33 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 448 + - - 7 + - 3465.82 + - - - 4288 + - 448 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 448 + - - 2 + - 1651.61 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 256 + - - 7 + - 3075.82 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 704 + - - 4 + - 3504.25 + - - - 704 + - 4288 + - 1 + - 128 + - 704 + - 704 + - 704 + - 4288 + - - 1 + - 1728.71 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1856 + - - 18 + - 4128.67 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 704 + - 2944 + - - 18 + - 3021.52 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 765.042 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 5056 + - - 10 + - 4278.86 + - - - 64 + - 2368 + - 1 + - 128 + - 64 + - 64 + - 64 + - 2368 + - - 3 + - 250.241 + - - 
- 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 448 + - - 18 + - 2868.8 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 2368 + - - 4 + - 3289.5 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 64 + - - 12 + - 248.026 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 5056 + - - 17 + - 4065.98 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3584 + - - 21 + - 3791.52 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1408 + - - 18 + - 3892.98 + - - - 448 + - 3584 + - 1 + - 128 + - 448 + - 448 + - 448 + - 3584 + - - 2 + - 1458.84 + - - - 128 + - 1408 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1408 + - - 3 + - 306.438 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 1024 + - - 17 + - 3394.41 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 704 + - - 4 + - 1946.49 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 2378.82 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 6784 + - - 10 + - 4373.11 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 3584 + - - 17 + - 4095.54 + - - - 5888 + - 5056 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 5056 + - - 0 + - 2660.24 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 64 + - - 4 + - 2292.55 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 128 + - - 28 + - 20.4211 + - - - 4288 + - 128 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 3 + - 757.707 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 704 + - 2368 + - - 18 + - 3294.34 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 5888 + - - 10 + - 4325.87 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 256 + - - 4 + - 3396.85 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 2646.84 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 5056 + - - 7 + - 3248.34 + - - - 5888 + - 64 + - 1 
+ - 3328 + - 5888 + - 5888 + - 5888 + - 64 + - - 7 + - 3192.06 + - - - 5056 + - 5056 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 5056 + - - 0 + - 2591.14 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 448 + - - 4 + - 4200.73 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 704 + - 256 + - - 7 + - 1616.96 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 64 + - - 4 + - 3663.64 + - - - 2368 + - 2368 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 2368 + - - 1 + - 2102.13 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1024 + - - 7 + - 1198.37 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 448 + - - 7 + - 2693.0 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 4288 + - - 18 + - 3843.54 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 2944 + - - 10 + - 4104.08 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 448 + - - 6 + - 1832.89 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 704 + - - 9 + - 2854.84 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 704 + - 5888 + - - 18 + - 3598.61 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 4 + - 256 + - - 28 + - 15.1237 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 64 + - - 14 + - 1539.49 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1408 + - - 4 + - 3051.08 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 128 + - 448 + - - 4 + - 532.401 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 704 + - - 4 + - 3602.24 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 256 + - - 4 + - 3264.52 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 3584 + - - 17 + - 4359.56 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 448 + - - 7 + - 2737.58 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1856 + - - 18 + - 3676.41 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 704 + - 
64 + - - 7 + - 415.902 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 64 + - - 7 + - 3473.41 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 256 + - 704 + - - 4 + - 1601.99 + - - - 6784 + - 6784 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 6784 + - - 0 + - 2747.11 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 128 + - 128 + - - 15 + - 107.657 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 2368 + - - 18 + - 3661.38 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 2368 + - - 18 + - 3993.21 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 64 + - 704 + - - 7 + - 417.911 + - - - 1856 + - 704 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 704 + - - 1 + - 1258.64 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 4288 + - - 10 + - 4225.49 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 448 + - 4 + - - 31 + - 24.9322 + - - - 64 + - 1024 + - 1 + - 128 + - 64 + - 64 + - 64 + - 1024 + - - 3 + - 110.145 + - - - 2944 + - 1856 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 1856 + - - 0 + - 2084.03 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 64 + - - 7 + - 1046.76 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 3584 + - - 10 + - 4278.32 + - - - 3584 + - 6784 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 6784 + - - 0 + - 2641.2 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 256 + - 6784 + - - 18 + - 3413.67 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 15 + - 996.057 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 704 + - - 18 + - 3029.81 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 2368 + - - 4 + - 2464.44 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 5888 + - - 20 + - 4117.44 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 128 + - 3584 + - - 4 + - 3161.54 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1024 + - - 19 + - 804.387 + - - - 4288 + 
- 5056 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 5056 + - - 0 + - 2562.86 + - - - 1856 + - 1856 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 1856 + - - 1 + - 1826.84 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1024 + - - 17 + - 3404.05 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 64 + - - 5 + - 1010.42 + - - - 1856 + - 5888 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 5888 + - - 1 + - 2349.51 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 4 + - 5056 + - - 27 + - 176.822 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1408 + - - 23 + - 3492.59 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 3584 + - - 18 + - 2711.0 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 64 + - - 7 + - 2631.56 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1024 + - - 18 + - 3653.64 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 64 + - - 12 + - 156.437 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 128 + - 2944 + - - 4 + - 1841.01 + - - - 1856 + - 2944 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 2944 + - - 0 + - 2090.01 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 4 + - 2368 + - - 27 + - 40.0931 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 128 + - - 12 + - 243.942 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 256 + - - 18 + - 3403.22 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 4288 + - - 17 + - 4292.66 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 256 + - - 7 + - 2924.32 + - - - 448 + - 5888 + - 1 + - 128 + - 448 + - 448 + - 448 + - 5888 + - - 1 + - 1660.31 + - - - 1408 + - 6784 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 6784 + - - 0 + - 2379.79 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 6784 + - - 10 + - 4355.93 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 4288 + - - 18 + - 4020.58 + - - - 4288 + - 4 + - 1 + - 3328 + - 
4288 + - 4288 + - 4288 + - 4 + - - 30 + - 303.241 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 3584 + - - 17 + - 4253.07 + - - - 2944 + - 1024 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 1024 + - - 1 + - 1581.98 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 6784 + - - 26 + - 343.851 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 448 + - - 7 + - 3013.1 + - - - 4 + - 1856 + - 1 + - 128 + - 4 + - 4 + - 4 + - 1856 + - - 25 + - 16.9209 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 448 + - 64 + - - 15 + - 181.325 + - - - 128 + - 64 + - 1 + - 128 + - 128 + - 128 + - 128 + - 64 + - - 3 + - 14.1394 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 128 + - - 15 + - 1290.69 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 704 + - 6784 + - - 18 + - 3783.86 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 64 + - - 7 + - 870.676 + - - - 5888 + - 704 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 704 + - - 1 + - 1953.54 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 3584 + - - 20 + - 4095.68 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 704 + - 1856 + - - 18 + - 3428.15 + - - - 256 + - 5056 + - 1 + - 128 + - 256 + - 256 + - 256 + - 5056 + - - 1 + - 1252.08 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2944 + - - 18 + - 2286.0 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 256 + - - 5 + - 490.644 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1856 + - - 20 + - 4151.88 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 448 + - - 18 + - 2496.15 + - - - 2944 + - 2944 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 2944 + - - 0 + - 2350.01 + - - - 64 + - 256 + - 1 + - 128 + - 64 + - 64 + - 64 + - 256 + - - 3 + - 26.2669 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 256 + - - 4 + - 3965.53 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 5056 + - - 10 + - 
4320.66 + - - - 1408 + - 3584 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 3584 + - - 1 + - 2021.04 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 64 + - - 28 + - 7.7913 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 3584 + - - 10 + - 4019.58 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 256 + - - 14 + - 264.41 + - - - 704 + - 1408 + - 1 + - 128 + - 704 + - 704 + - 704 + - 1408 + - - 1 + - 1042.03 + - - - 2368 + - 704 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 704 + - - 2 + - 1443.35 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 6784 + - - 18 + - 3944.76 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1024 + - - 4 + - 3656.96 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 64 + - 4 + - - 28 + - 4.39642 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 704 + - 128 + - - 4 + - 831.004 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 2944 + - - 18 + - 3875.96 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1856 + - - 4 + - 3831.19 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1024 + - - 20 + - 3930.41 + - - - 1024 + - 2368 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 2368 + - - 1 + - 1655.18 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 64 + - - 7 + - 1858.03 + - - - 704 + - 5056 + - 1 + - 128 + - 704 + - 704 + - 704 + - 5056 + - - 1 + - 1836.53 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 448 + - - 18 + - 3133.99 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 6784 + - - 4 + - 4087.96 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 4288 + - - 4 + - 4202.05 + - - - 448 + - 2944 + - 1 + - 128 + - 448 + - 448 + - 448 + - 2944 + - - 1 + - 1259.1 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 64 + - 448 + - - 4 + - 266.2 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 256 + - 64 + - - 4 + - 150.802 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + 
- 4288 + - 2368 + - - 18 + - 4150.08 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 448 + - - 7 + - 3869.44 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 6784 + - - 10 + - 4228.86 + - - - 1024 + - 4288 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 4288 + - - 1 + - 2006.13 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1024 + - - 18 + - 3398.52 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1408 + - - 10 + - 4189.86 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 64 + - - 19 + - 1489.79 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 256 + - 5888 + - - 4 + - 3157.4 + - - - 2368 + - 128 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 3 + - 485.452 + - - - 1024 + - 1856 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 1856 + - - 1 + - 1565.04 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1408 + - - 7 + - 3090.7 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 256 + - - 4 + - 3104.03 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 128 + - - 18 + - 2621.44 + - - - 4 + - 4 + - 1 + - 128 + - 4 + - 4 + - 4 + - 4 + - - 25 + - 0.0345949 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 64 + - 6784 + - - 7 + - 3046.85 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 128 + - 4 + - - 30 + - 3.30323 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 2368 + - - 7 + - 1646.35 + - - - 704 + - 64 + - 1 + - 128 + - 704 + - 704 + - 704 + - 64 + - - 3 + - 79.7451 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1856 + - - 7 + - 2752.11 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1856 + - - 17 + - 4081.4 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 4288 + - - 18 + - 3797.55 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 5056 + - - 20 + - 3949.43 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 256 + - - 19 + - 1383.42 + - - 
- 2368 + - 448 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 448 + - - 1 + - 1038.79 + - - - 2368 + - 64 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 64 + - - 3 + - 257.961 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 3584 + - - 4 + - 3602.42 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 448 + - - 4 + - 3615.0 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 2944 + - - 7 + - 2198.01 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 704 + - 64 + - - 15 + - 280.504 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 4 + - 64 + - - 31 + - 1.66504 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 2368 + - - 7 + - 2924.63 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 5056 + - - 18 + - 3738.15 + - - - 4288 + - 2944 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 2944 + - - 1 + - 2408.85 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 2944 + - - 4 + - 3834.69 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 1024 + - - 11 + - 3654.42 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 256 + - - 4 + - 3688.11 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 5056 + - - 4 + - 3978.54 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 6784 + - - 10 + - 4112.92 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 448 + - 448 + - - 7 + - 1769.29 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 2944 + - - 20 + - 4115.75 + - - - 3584 + - 3584 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 3584 + - - 0 + - 2393.12 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 2944 + - - 28 + - 205.439 + - - - 5056 + - 2944 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 2944 + - - 0 + - 2466.94 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 128 + - - 9 + - 2755.49 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 448 + - - 7 + - 2559.7 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 
5888 + - 5888 + - 2944 + - - 10 + - 4289.38 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 4 + - 5888 + - - 26 + - 89.4026 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 128 + - 2944 + - - 7 + - 2652.19 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 5888 + - - 20 + - 4387.06 + - - - 6784 + - 4 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 4 + - - 25 + - 60.8948 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 64 + - - 7 + - 2232.13 + - - - 5888 + - 3584 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 3584 + - - 0 + - 2599.05 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 4288 + - - 27 + - 262.078 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1856 + - - 4 + - 4030.52 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1024 + - - 18 + - 2883.83 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 3584 + - - 10 + - 4219.95 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 128 + - - 18 + - 2826.24 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 128 + - - 15 + - 212.262 + - - - 5888 + - 6784 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 6784 + - - 0 + - 2725.29 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 128 + - - 15 + - 1008.25 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 5888 + - - 18 + - 4094.36 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 6784 + - - 4 + - 3695.82 + - - - 128 + - 4288 + - 1 + - 128 + - 128 + - 128 + - 128 + - 4288 + - - 3 + - 679.708 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 2368 + - - 10 + - 4095.54 + - - - 3584 + - 4288 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 4288 + - - 0 + - 2510.89 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 4288 + - - 27 + - 336.41 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 64 + - - 19 + - 807.929 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1408 + - - 
18 + - 3957.28 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1408 + - - 18 + - 2323.77 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 5888 + - - 18 + - 3895.64 + - - - 64 + - 128 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 3 + - 13.2396 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 3584 + - - 17 + - 4007.14 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1408 + - - 18 + - 3843.87 + - - - 4 + - 6784 + - 1 + - 128 + - 4 + - 4 + - 4 + - 6784 + - - 24 + - 60.7244 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 5056 + - - 18 + - 4011.8 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3584 + - - 27 + - 299.839 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 64 + - 4 + - - 30 + - 1.77701 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1024 + - - 17 + - 3679.32 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 5888 + - - 18 + - 4172.63 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 256 + - - 28 + - 40.1495 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 5056 + - - 18 + - 4015.24 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 256 + - 448 + - - 7 + - 1056.63 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 3584 + - - 17 + - 4099.34 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 256 + - - 7 + - 3818.82 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 64 + - - 7 + - 1687.31 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 4288 + - - 17 + - 4338.94 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1856 + - - 28 + - 157.033 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1856 + - - 18 + - 3018.91 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 256 + - - 23 + - 3172.11 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 6784 + - - 17 + - 4204.59 + - - - 1024 + - 1024 + - 1 
+ - 1792 + - 1024 + - 1024 + - 1024 + - 1024 + - - 18 + - 2847.39 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 5888 + - - 18 + - 4149.61 + - - - 5056 + - 4288 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 4288 + - - 0 + - 2562.86 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 6784 + - - 4 + - 3986.64 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 4288 + - - 4 + - 2662.89 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 128 + - - 7 + - 1192.69 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 4 + - - 27 + - 78.0661 + - - - 256 + - 3584 + - 1 + - 128 + - 256 + - 256 + - 256 + - 3584 + - - 1 + - 1038.93 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 64 + - - 5 + - 698.744 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 704 + - - 28 + - 98.525 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1024 + - - 17 + - 3545.23 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 3584 + - - 17 + - 4326.23 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 704 + - 5056 + - - 18 + - 3478.97 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 6784 + - - 17 + - 4218.14 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1408 + - - 18 + - 3632.12 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1408 + - - 15 + - 996.057 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1024 + - - 17 + - 3544.86 + - - - 6784 + - 256 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 256 + - - 2 + - 1537.76 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 64 + - - 7 + - 3020.35 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 704 + - - 7 + - 2409.24 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 31 + - 5.70871 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 4 + - - 26 + - 341.665 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 
4 + - - 31 + - 203.067 + - - - 128 + - 3584 + - 1 + - 128 + - 128 + - 128 + - 128 + - 3584 + - - 3 + - 609.637 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 3751.53 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 128 + - - 7 + - 3666.09 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 4 + - - 30 + - 314.513 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 4288 + - - 17 + - 4302.74 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 64 + - 3584 + - - 4 + - 1980.22 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 256 + - - 23 + - 3486.71 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 128 + - - 7 + - 3194.01 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 2368 + - - 18 + - 3916.28 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 2944 + - - 18 + - 3613.32 + - - - 256 + - 448 + - 1 + - 128 + - 256 + - 256 + - 256 + - 448 + - - 3 + - 195.63 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 2368 + - - 10 + - 4219.07 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1024 + - - 13 + - 3334.33 + - - - 5056 + - 3584 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 3584 + - - 0 + - 2541.48 + - - - 128 + - 448 + - 1 + - 128 + - 128 + - 128 + - 128 + - 448 + - - 3 + - 98.4446 + - - - 5056 + - 4 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 4 + - - 25 + - 45.5115 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1856 + - - 7 + - 684.881 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 64 + - - 15 + - 1638.4 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 256 + - - 7 + - 2572.71 + - - - 704 + - 448 + - 1 + - 128 + - 704 + - 704 + - 704 + - 448 + - - 3 + - 507.163 + - - - 1024 + - 6784 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 6784 + - - 1 + - 2163.7 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 2944 + - - 18 + - 4017.85 + 
- - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1408 + - - 18 + - 2895.43 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 5056 + - - 17 + - 4221.24 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 704 + - - 5 + - 961.688 + - - - 128 + - 704 + - 1 + - 128 + - 128 + - 128 + - 128 + - 704 + - - 3 + - 153.545 + - - - 128 + - 5056 + - 1 + - 128 + - 128 + - 128 + - 128 + - 5056 + - - 3 + - 786.233 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 15 + - 397.942 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 64 + - - 12 + - 87.6317 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 448 + - - 28 + - 66.5006 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 5888 + - - 10 + - 4293.47 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 5056 + - - 18 + - 4110.19 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 128 + - 704 + - - 7 + - 530.071 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 5056 + - - 17 + - 4385.19 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 448 + - 64 + - - 7 + - 265.43 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 128 + - - 11 + - 3079.28 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 4288 + - - 18 + - 4112.83 + - - - 4288 + - 1856 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 1856 + - - 1 + - 2206.49 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 2944 + - - 10 + - 4255.37 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1408 + - - 4 + - 3177.6 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 704 + - - 7 + - 3550.0 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1024 + - - 17 + - 3641.44 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 3584 + - - 17 + - 4170.99 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 448 + - - 5 + - 1195.15 + - - - 64 + - 64 + - 1 + - 128 + - 
64 + - 64 + - 64 + - 64 + - - 3 + - 6.32587 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 2944 + - - 10 + - 4257.95 + - - - 1408 + - 2944 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 2944 + - - 1 + - 1924.62 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 2944 + - - 18 + - 3974.12 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 448 + - - 4 + - 2165.2 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 704 + - - 7 + - 2558.78 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 256 + - - 4 + - 3802.07 + - - - 256 + - 1024 + - 1 + - 128 + - 256 + - 256 + - 256 + - 1024 + - - 1 + - 361.266 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 448 + - - 6 + - 1342.92 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 64 + - 2368 + - - 7 + - 861.397 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1408 + - - 7 + - 533.997 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 4 + - - 27 + - 253.563 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 5056 + - - 10 + - 4232.24 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1024 + - - 4 + - 2131.41 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 4288 + - - 10 + - 4277.59 + - - - 2944 + - 1408 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 1408 + - - 1 + - 1943.8 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 4 + - 704 + - - 28 + - 35.338 + - - - 64 + - 1408 + - 1 + - 128 + - 64 + - 64 + - 64 + - 1408 + - - 3 + - 151.131 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 6784 + - - 4 + - 3809.69 + - - - 6784 + - 1408 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 1408 + - - 0 + - 2365.06 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 704 + - - 7 + - 3542.33 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 5888 + - - 17 + - 4406.81 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 5888 + - - 27 + - 299.244 + 
- - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 5888 + - - 10 + - 4351.82 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 4288 + - - 17 + - 4330.78 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 4288 + - - 10 + - 4026.38 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1024 + - - 18 + - 2237.5 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 5056 + - - 10 + - 4263.29 + - - - 448 + - 448 + - 1 + - 128 + - 448 + - 448 + - 448 + - 448 + - - 3 + - 340.176 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 2944 + - - 18 + - 3891.51 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 5056 + - - 18 + - 4129.48 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1408 + - - 4 + - 3598.35 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 2368 + - - 18 + - 3792.02 + - - - 6784 + - 64 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 64 + - - 3 + - 654.126 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 5056 + - - 20 + - 4019.33 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 448 + - - 4 + - 4052.05 + - - - 704 + - 3584 + - 1 + - 128 + - 704 + - 704 + - 704 + - 3584 + - - 0 + - 1618.69 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 448 + - - 4 + - 3986.63 + - - - 128 + - 5888 + - 1 + - 128 + - 128 + - 128 + - 128 + - 5888 + - - 1 + - 891.91 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1856 + - - 17 + - 4117.54 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 704 + - - 4 + - 4106.76 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 4 + - - 27 + - 245.186 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 2368 + - - 9 + - 2680.52 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 2368 + - - 10 + - 4021.64 + - - - 4288 + - 3584 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 3584 + - - 0 + - 
2519.38 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 704 + - 5056 + - - 20 + - 3749.64 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1856 + - - 7 + - 3682.38 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 6784 + - - 18 + - 3883.84 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 6784 + - - 26 + - 293.93 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 448 + - 5888 + - - 18 + - 3609.34 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 2944 + - - 10 + - 4137.99 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 5056 + - - 18 + - 3991.76 + - - - 2368 + - 3584 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 3584 + - - 0 + - 2301.54 + - - - 256 + - 1856 + - 1 + - 128 + - 256 + - 256 + - 256 + - 1856 + - - 1 + - 618.566 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1024 + - - 11 + - 3788.93 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 256 + - - 4 + - 3555.3 + - - - 704 + - 1024 + - 1 + - 128 + - 704 + - 704 + - 704 + - 1024 + - - 3 + - 893.442 + - - - 1024 + - 3584 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 3584 + - - 1 + - 1864.73 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1408 + - - 10 + - 3973.22 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 4288 + - - 4 + - 3408.06 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 5888 + - - 18 + - 4186.47 + - - - 4 + - 2368 + - 1 + - 128 + - 4 + - 4 + - 4 + - 2368 + - - 25 + - 21.6196 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1856 + - - 20 + - 3843.69 + - - - 1408 + - 1024 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 1024 + - - 1 + - 1363.4 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 128 + - 128 + - - 7 + - 151.968 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 704 + - - 7 + - 3695.08 + - - - 2944 + - 5888 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 5888 + - - 0 + - 2565.43 + - 
- - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 4 + - - 31 + - 25.3124 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1856 + - - 28 + - 225.76 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 64 + - - 4 + - 2012.65 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 4 + - - 27 + - 40.9047 + - - - 4 + - 128 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 25 + - 1.14255 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 2368 + - - 18 + - 3836.34 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 704 + - - 18 + - 3800.79 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 448 + - 1856 + - - 18 + - 2529.24 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 256 + - 4288 + - - 4 + - 3105.86 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1408 + - - 18 + - 3891.51 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3584 + - - 4 + - 3521.42 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 2368 + - - 18 + - 3970.99 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 4288 + - - 4 + - 4071.82 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 1856 + - - 18 + - 3848.19 + - - - 704 + - 2368 + - 1 + - 128 + - 704 + - 704 + - 704 + - 2368 + - - 2 + - 1506.11 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1408 + - - 4 + - 3640.04 + - - - 2944 + - 704 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 704 + - - 1 + - 1502.55 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 6784 + - - 10 + - 4270.68 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1024 + - - 7 + - 604.367 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 2368 + - - 4 + - 3552.7 + - - - 5888 + - 2368 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 2368 + - - 0 + - 2425.89 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 704 + - - 31 + - 67.4635 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 
+ - 1024 + - 704 + - - 4 + - 3388.18 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 704 + - - 7 + - 3647.13 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 5888 + - - 4 + - 3869.31 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 3584 + - - 20 + - 4239.5 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 128 + - 6784 + - - 7 + - 3237.35 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 4 + - - 28 + - 154.984 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 4288 + - - 18 + - 3993.7 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 704 + - 128 + - - 7 + - 535.982 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 2368 + - - 9 + - 1832.19 + - - - 5056 + - 5888 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 5888 + - - 0 + - 2645.76 + - - - 4 + - 1024 + - 1 + - 128 + - 4 + - 4 + - 4 + - 1024 + - - 24 + - 9.1023 + - - - 5056 + - 1024 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 1024 + - - 0 + - 1991.29 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 4 + - - 27 + - 70.0976 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 4 + - 128 + - - 27 + - 3.33686 + - - - 2944 + - 256 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 256 + - - 3 + - 942.08 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 4 + - 128 + - - 31 + - 7.94055 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 5888 + - - 18 + - 4111.91 + - - - 64 + - 3584 + - 1 + - 128 + - 64 + - 64 + - 64 + - 3584 + - - 3 + - 366.635 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1408 + - - 10 + - 4186.8 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 4288 + - - 17 + - 4328.17 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 4 + - - 27 + - 283.047 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 5056 + - - 10 + - 4255.14 + - - - 64 + - 6784 + - 1 + - 128 + - 64 + - 64 + - 64 + - 6784 + - - 3 + - 593.238 + - - - 1024 + - 6784 + 
- 1 + - 256 + - 1024 + - 1024 + - 1024 + - 6784 + - - 18 + - 3577.38 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3584 + - - 17 + - 4261.24 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 1408 + - - 18 + - 3916.76 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 2368 + - - 18 + - 4146.85 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 5888 + - - 18 + - 4023.53 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1024 + - - 18 + - 3312.88 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 128 + - - 18 + - 3464.75 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 4 + - - 31 + - 18.4869 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 7 + - 2245.84 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 5888 + - - 18 + - 4052.77 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 5888 + - - 17 + - 4290.43 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 4 + - - 31 + - 65.9356 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 704 + - 5888 + - - 18 + - 3830.35 + - - - 1408 + - 256 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 256 + - - 3 + - 570.442 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 4 + - 1856 + - - 28 + - 82.6803 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 64 + - - 7 + - 2121.17 + - - - 5888 + - 256 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 256 + - - 1 + - 1272.01 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 7 + - 106.131 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 2944 + - - 10 + - 4169.27 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 704 + - - 18 + - 3340.25 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 704 + - - 4 + - 3509.94 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 5056 + - - 17 + - 4418.77 + - - - 2368 + - 1024 + - 1 + - 
768 + - 2368 + - 2368 + - 2368 + - 1024 + - - 17 + - 3243.02 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 64 + - 128 + - - 14 + - 78.408 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 5888 + - - 17 + - 4295.2 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 448 + - - 4 + - 3950.48 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 2368 + - - 7 + - 4080.47 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 5056 + - - 4 + - 3768.51 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 5056 + - - 20 + - 4242.36 + - - - 448 + - 1024 + - 1 + - 128 + - 448 + - 448 + - 448 + - 1024 + - - 3 + - 675.878 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1856 + - - 19 + - 1369.41 + - - - 4 + - 256 + - 1 + - 128 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 2.30114 + - - - 256 + - 256 + - 1 + - 128 + - 256 + - 256 + - 256 + - 256 + - - 3 + - 110.609 + - - - 256 + - 4 + - 1 + - 128 + - 256 + - 256 + - 256 + - 4 + - - 25 + - 2.47495 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 64 + - - 4 + - 2620.49 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 4 + - 5056 + - - 30 + - 77.4124 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 15 + - 205.201 + - - - 1024 + - 448 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 448 + - - 1 + - 598.698 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 2944 + - - 18 + - 3797.83 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 5056 + - - 4 + - 3639.16 + - - - 256 + - 128 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 3 + - 54.4432 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 6784 + - - 10 + - 4240.62 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 2944 + - - 10 + - 4111.07 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 128 + - - 9 + - 3085.51 + - - - 6784 + - 704 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 704 + - - 0 + - 
2080.45 + - - - 4 + - 5056 + - 1 + - 128 + - 4 + - 4 + - 4 + - 5056 + - - 25 + - 45.7044 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 4 + - 2368 + - - 28 + - 99.8147 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1024 + - - 9 + - 1598.53 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 4 + - - 30 + - 173.349 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 5056 + - - 18 + - 3940.89 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 5056 + - - 10 + - 4331.25 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 2368 + - - 18 + - 4108.37 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 5888 + - - 17 + - 4331.86 + - - - 1856 + - 256 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 256 + - - 3 + - 700.016 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 1024 + - - 17 + - 3335.93 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 64 + - - 4 + - 2181.49 + - - - 3584 + - 128 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 3 + - 619.935 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 5888 + - - 18 + - 4130.53 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 6784 + - - 4 + - 3678.56 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 448 + - - 4 + - 3782.24 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 4 + - - 26 + - 291.814 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 6784 + - - 10 + - 4101.34 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1024 + - - 4 + - 3865.52 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1856 + - - 18 + - 3882.67 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 64 + - - 15 + - 103.819 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 4 + - - 28 + - 136.643 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 5888 + - - 4 + - 3770.73 + - - - 5888 + - 5888 + 
- 1 + - 128 + - 5888 + - 5888 + - 5888 + - 5888 + - - 0 + - 2683.46 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 256 + - - 4 + - 4030.52 + - - - 3584 + - 448 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 448 + - - 1 + - 1310.05 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 4 + - 64 + - - 28 + - 4.2965 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 128 + - 4288 + - - 7 + - 1735.54 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 128 + - - 7 + - 2673.75 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 6784 + - - 10 + - 4399.08 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 5888 + - - 4 + - 3959.55 + - - - 1408 + - 1408 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 1408 + - - 1 + - 1424.95 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 64 + - - 8 + - 2768.63 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 5888 + - - 18 + - 3704.65 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 64 + - 2944 + - - 15 + - 1032.42 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1024 + - - 4 + - 1857.26 + - - - 128 + - 128 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 26.8041 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 4288 + - - 17 + - 4073.06 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 6784 + - - 10 + - 4426.76 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1408 + - - 18 + - 4125.6 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 4288 + - - 18 + - 4117.75 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1024 + - - 17 + - 3585.52 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1856 + - - 17 + - 4271.66 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 5056 + - - 20 + - 4195.67 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1408 + - - 18 + - 3657.61 + - - - 128 + - 4 + - 1 + - 768 + 
- 128 + - 128 + - 128 + - 4 + - - 31 + - 7.9534 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 5888 + - - 10 + - 4203.36 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 1408 + - - 18 + - 3912.3 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 4288 + - - 18 + - 3756.56 + - - - 1024 + - 2944 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 2944 + - - 1 + - 1734.43 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 2368 + - - 18 + - 3984.42 + - - - 2368 + - 2944 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 2944 + - - 1 + - 2173.05 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1408 + - - 18 + - 4054.06 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 5888 + - - 17 + - 4259.72 + - - - 128 + - 1024 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1024 + - - 3 + - 220.058 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 4 + - - 28 + - 14.9139 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 5888 + - - 4 + - 3444.97 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1856 + - - 7 + - 2088.51 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 448 + - - 4 + - 3408.93 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 2944 + - - 10 + - 4283.69 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 704 + - - 15 + - 996.057 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 4288 + - - 18 + - 3974.62 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 4 + - - 27 + - 139.438 + - - - 6784 + - 5888 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 5888 + - - 0 + - 2722.04 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 2944 + - - 28 + - 282.028 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 2368 + - - 18 + - 4126.13 + - - - 448 + - 6784 + - 1 + - 128 + - 448 + - 448 + - 448 + - 6784 + - - 1 + - 1737.95 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 
4288 + - 4288 + - 704 + - - 7 + - 3707.38 + - - - 1024 + - 64 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 64 + - - 1 + - 92.3855 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 5056 + - - 18 + - 4128.06 + - - - 704 + - 704 + - 1 + - 128 + - 704 + - 704 + - 704 + - 704 + - - 3 + - 700.517 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 2944 + - - 7 + - 3898.96 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 4 + - - 26 + - 258.358 + - - - 6784 + - 4288 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 4288 + - - 0 + - 2673.08 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 704 + - - 18 + - 3830.72 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 4 + - 4 + - - 27 + - 0.0992248 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 6784 + - - 10 + - 4409.46 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 128 + - - 14 + - 497.629 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1856 + - - 17 + - 4223.43 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 256 + - - 4 + - 2927.15 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 2944 + - - 17 + - 4199.12 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 4288 + - - 18 + - 4149.93 + - - - 128 + - 1856 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1856 + - - 3 + - 369.396 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 5888 + - - 10 + - 4360.42 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 5888 + - - 4 + - 3565.61 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1856 + - - 17 + - 4106.84 + - - - 128 + - 2368 + - 1 + - 128 + - 128 + - 128 + - 128 + - 2368 + - - 3 + - 449.459 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1408 + - - 18 + - 3990.43 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 2944 + - - 10 + - 4228.67 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 
+ - 1024 + - 2368 + - - 4 + - 4100.37 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4288 + - - 18 + - 2549.15 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 4288 + - - 17 + - 4221.65 + - - - 5888 + - 128 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 1 + - 888.624 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3584 + - - 4 + - 3882.04 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1856 + - - 4 + - 3463.89 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 448 + - 5056 + - - 18 + - 3625.35 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1856 + - - 18 + - 3275.04 + - - - 4 + - 3584 + - 1 + - 128 + - 4 + - 4 + - 4 + - 3584 + - - 24 + - 32.3068 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1408 + - - 31 + - 122.009 + - - - 256 + - 2368 + - 1 + - 128 + - 256 + - 256 + - 256 + - 2368 + - - 1 + - 732.025 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 2944 + - - 10 + - 4146.13 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 6784 + - - 10 + - 4364.3 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 128 + - 6784 + - - 18 + - 2542.29 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 64 + - 5056 + - - 7 + - 2282.44 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 5056 + - - 10 + - 4106.76 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 704 + - - 18 + - 3427.21 + - - - 2368 + - 4288 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 4288 + - - 1 + - 2346.73 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 4 + - 6784 + - - 29 + - 99.3538 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5888 + - - 18 + - 2693.16 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 448 + - - 4 + - 3668.9 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 448 + - - 4 + - 3601.24 + - - - 4 + - 704 + - 1 + - 128 + - 4 + - 4 + - 4 + - 704 + - - 25 + - 6.32815 + - - - 2368 
+ - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 1856 + - - 18 + - 4061.62 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 2944 + - - 4 + - 3714.63 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1408 + - - 10 + - 4141.17 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 1408 + - - 18 + - 3321.05 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1024 + - - 13 + - 3807.84 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1024 + - - 18 + - 2378.06 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 5888 + - - 4 + - 3035.25 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 2368 + - - 10 + - 4106.78 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3584 + - - 17 + - 4111.9 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 2368 + - - 7 + - 4162.42 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 2944 + - - 7 + - 3682.23 + - - - 1024 + - 256 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 256 + - - 3 + - 397.188 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 2368 + - - 4 + - 3410.77 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 4 + - 4288 + - - 27 + - 158.022 + - - - 5056 + - 1408 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 1408 + - - 1 + - 2206.11 + - - - 1408 + - 64 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 64 + - - 3 + - 155.198 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 6784 + - - 10 + - 4326.23 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 4 + - - 28 + - 0.664939 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1408 + - - 7 + - 1959.72 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1408 + - - 18 + - 3914.63 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1024 + - - 15 + - 1350.82 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1024 + - - 7 + - 2965.67 + - - - 64 + - 5888 + - 1 
+ - 3328 + - 64 + - 64 + - 64 + - 5888 + - - 7 + - 3203.15 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 3584 + - - 4 + - 3683.17 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 4 + - 1408 + - - 28 + - 64.3657 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 704 + - - 18 + - 3000.35 + - - - 1024 + - 128 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 3 + - 217.999 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 704 + - 448 + - - 7 + - 2231.22 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 448 + - - 4 + - 3661.0 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 128 + - - 7 + - 1524.35 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 256 + - 3584 + - - 4 + - 3395.54 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 448 + - 3584 + - - 18 + - 2731.54 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 256 + - - 18 + - 2832.88 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1856 + - - 7 + - 2300.2 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 2944 + - - 10 + - 4303.65 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1856 + - - 18 + - 3877.93 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 3584 + - - 10 + - 3871.18 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 2944 + - - 4 + - 3705.46 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 448 + - 128 + - - 7 + - 531.373 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 704 + - - 7 + - 3091.13 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 5056 + - - 27 + - 354.839 + - - - 64 + - 4 + - 1 + - 128 + - 64 + - 64 + - 64 + - 4 + - - 25 + - 0.615946 + - - - 5056 + - 448 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 448 + - - 1 + - 1577.08 + - - - 64 + - 5888 + - 1 + - 128 + - 64 + - 64 + - 64 + - 5888 + - - 3 + - 523.833 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 5056 + - - 17 + - 
4123.63 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1024 + - - 17 + - 3604.78 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 704 + - - 7 + - 2696.88 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1856 + - - 18 + - 4007.26 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 604.948 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1856 + - - 7 + - 2542.53 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 128 + - - 7 + - 2534.06 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 5056 + - - 17 + - 4106.94 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 4 + - - 30 + - 221.927 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 4 + - 1914.97 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 5888 + - - 18 + - 3954.83 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 128 + - - 7 + - 3874.94 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 64 + - - 9 + - 2566.05 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 2944 + - - 10 + - 4295.21 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 64 + - 5888 + - - 7 + - 2658.04 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 2944 + - - 18 + - 3684.16 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1408 + - - 18 + - 3964.21 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 18 + - 2981.91 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 448 + - - 16 + - 687.467 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 3584 + - - 20 + - 3467.39 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1408 + - - 18 + - 4066.8 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 256 + - - 4 + - 3403.34 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 2368 + - - 18 + - 
3993.31 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 64 + - - 7 + - 1088.1 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1024 + - - 13 + - 3701.79 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 3584 + - - 10 + - 4046.01 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1408 + - - 7 + - 2930.68 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1408 + - - 18 + - 4185.7 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1408 + - - 18 + - 3911.48 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 2368 + - - 4 + - 3656.94 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 4288 + - - 17 + - 4350.7 + - - - 4288 + - 2368 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 2368 + - - 1 + - 2350.8 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 704 + - 4288 + - - 7 + - 3613.47 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 448 + - 1408 + - - 4 + - 1992.6 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 1235.38 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 448 + - - 5 + - 751.612 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 4288 + - - 20 + - 4328.85 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 4 + - - 28 + - 182.754 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 3584 + - - 7 + - 3720.27 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 4 + - 448 + - - 30 + - 9.36993 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 448 + - 5888 + - - 18 + - 3352.28 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3584 + - - 20 + - 4163.88 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 4288 + - - 18 + - 3972.85 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 4 + - - 31 + - 48.6052 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 704 + - - 18 + - 3502.51 + - - - 4 + 
- 448 + - 1 + - 768 + - 4 + - 4 + - 4 + - 448 + - - 28 + - 24.4364 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 448 + - - 7 + - 672.164 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 448 + - - 18 + - 2538.89 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 5056 + - - 7 + - 2613.88 + - - - 4 + - 2944 + - 1 + - 128 + - 4 + - 4 + - 4 + - 2944 + - - 25 + - 26.8401 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 704 + - - 16 + - 603.621 + - - - 1856 + - 3584 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 3584 + - - 0 + - 2189.48 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 18 + - 2672.27 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 4 + - - 28 + - 84.4436 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 448 + - 4288 + - - 18 + - 3766.71 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 64 + - - 15 + - 1227.43 + - - - 704 + - 256 + - 1 + - 128 + - 704 + - 704 + - 704 + - 256 + - - 3 + - 302.262 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 4 + - - 28 + - 28.4941 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5056 + - - 18 + - 2927.12 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 704 + - - 18 + - 3988.26 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 64 + - - 19 + - 1144.93 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 4 + - - 27 + - 209.371 + - - - 64 + - 704 + - 1 + - 128 + - 64 + - 64 + - 64 + - 704 + - - 3 + - 69.7866 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 3584 + - - 17 + - 3866.47 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 704 + - - 4 + - 2153.94 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 128 + - - 16 + - 419.43 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 4288 + - - 4 + - 3776.96 + - - - 1408 + - 448 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 448 + - - 3 + - 
856.026 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1856 + - - 4 + - 3799.76 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 128 + - 2368 + - - 7 + - 2139.56 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1856 + - - 4 + - 3641.63 + - - - 2944 + - 2368 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 2368 + - - 1 + - 2182.4 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 64 + - 128 + - - 15 + - 51.7049 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 128 + - 64 + - - 14 + - 80.0847 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 6784 + - - 10 + - 4175.93 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 128 + - - 7 + - 747.648 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1024 + - - 20 + - 4157.98 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 256 + - - 7 + - 1941.81 + - - - 1024 + - 4 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 4 + - - 25 + - 9.55344 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 2368 + - - 18 + - 4019.02 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1024 + - - 20 + - 3915.08 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 704 + - 448 + - - 15 + - 1635.74 + - - - 4 + - 4288 + - 1 + - 128 + - 4 + - 4 + - 4 + - 4288 + - - 25 + - 38.4362 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 2944 + - - 18 + - 3914.16 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 448 + - 4288 + - - 18 + - 3411.36 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1408 + - - 7 + - 1623.03 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 4 + - - 28 + - 92.8648 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 3584 + - - 10 + - 4087.28 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 4 + - - 28 + - 126.918 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1408 + - - 4 + - 3333.04 + - - - 5056 + - 5888 + 
- 1 + - 256 + - 5056 + - 5056 + - 5056 + - 5888 + - - 10 + - 4186.47 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1856 + - - 7 + - 3920.22 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 3584 + - - 10 + - 3797.02 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 448 + - - 4 + - 3698.96 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 4288 + - - 18 + - 3913.84 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 64 + - - 5 + - 635.551 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 128 + - - 7 + - 1843.83 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1024 + - - 20 + - 3956.24 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 3584 + - - 4 + - 3815.84 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 4 + - - 28 + - 120.394 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 5888 + - - 4 + - 3142.02 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 704 + - - 20 + - 3754.17 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 4288 + - - 18 + - 4043.43 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 5056 + - - 18 + - 4118.79 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 5888 + - - 10 + - 4234.81 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 4 + - - 26 + - 89.7219 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 64 + - 2944 + - - 4 + - 1673.26 + - - - 256 + - 4288 + - 1 + - 128 + - 256 + - 256 + - 256 + - 4288 + - - 1 + - 1059.97 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1024 + - - 18 + - 2901.72 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 5888 + - - 20 + - 4413.53 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 4 + - - 28 + - 180.727 + - - - 4288 + - 256 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 256 + - - 1 + - 1092.95 + - - - 5056 + - 128 + - 1 + - 
256 + - 5056 + - 5056 + - 5056 + - 128 + - - 7 + - 2040.33 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 5056 + - - 10 + - 4265.22 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 4288 + - - 17 + - 4100.33 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 64 + - 3584 + - - 7 + - 1229.49 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 6784 + - - 10 + - 4374.0 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1408 + - - 7 + - 3717.89 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1856 + - - 4 + - 4119.35 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 5056 + - - 18 + - 4069.48 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 64 + - - 15 + - 389.805 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 704 + - - 18 + - 3221.88 + - - - 3584 + - 2368 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 2368 + - - 0 + - 2305.45 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 6784 + - - 18 + - 4073.09 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 5888 + - - 20 + - 4158.91 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 128 + - - 18 + - 2277.36 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 5888 + - - 18 + - 3944.64 + - - - 256 + - 704 + - 1 + - 128 + - 256 + - 256 + - 256 + - 704 + - - 3 + - 295.752 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 4 + - 5888 + - - 27 + - 195.758 + - - - 1856 + - 5056 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 5056 + - - 0 + - 2302.46 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 2944 + - - 18 + - 3542.75 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 64 + - 256 + - - 7 + - 150.657 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1419.74 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1024 + - - 18 + - 3710.99 + - - - 704 + - 5888 + - 1 + - 128 
+ - 704 + - 704 + - 704 + - 5888 + - - 1 + - 1948.37 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 2944 + - - 10 + - 4226.01 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 64 + - - 9 + - 1970.18 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 6784 + - - 10 + - 4370.09 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 128 + - - 4 + - 2744.47 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1856 + - - 10 + - 4075.23 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1856 + - - 4 + - 3598.24 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 64 + - - 7 + - 3009.28 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 4 + - - 28 + - 211.534 + - - - 5888 + - 64 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 64 + - - 3 + - 551.63 + - - - 128 + - 6784 + - 1 + - 128 + - 128 + - 128 + - 128 + - 6784 + - - 1 + - 998.823 + - - - 64 + - 2944 + - 1 + - 128 + - 64 + - 64 + - 64 + - 2944 + - - 3 + - 309.831 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 6784 + - - 10 + - 4276.65 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 4 + - - 28 + - 67.3416 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 1024 + - - 18 + - 3114.05 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 64 + - 4288 + - - 15 + - 1423.31 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 3584 + - - 7 + - 3652.59 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1408 + - - 18 + - 3664.19 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 448 + - - 18 + - 3368.74 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1408 + - - 18 + - 3186.28 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 448 + - 256 + - - 7 + - 1064.8 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4 + - - 31 + - 5.841 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 
704 + - - 21 + - 3164.76 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 4288 + - - 17 + - 4291.33 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 64 + - - 15 + - 1405.09 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1856 + - - 7 + - 3677.4 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 4 + - - 28 + - 11.0818 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 3584 + - - 17 + - 4209.17 + - - - 2368 + - 256 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 256 + - - 3 + - 808.277 + - - - 1408 + - 128 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 3 + - 304.819 + - - - 448 + - 2368 + - 1 + - 128 + - 448 + - 448 + - 448 + - 2368 + - - 1 + - 1054.93 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 64 + - 5056 + - - 7 + - 1607.87 + - - - 3584 + - 1024 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 1024 + - - 0 + - 1824.74 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 704 + - - 4 + - 3776.44 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 4 + - - 28 + - 68.489 + - - - 256 + - 6784 + - 1 + - 128 + - 256 + - 256 + - 256 + - 6784 + - - 1 + - 1435.29 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1408 + - - 7 + - 3736.07 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 5888 + - - 17 + - 4115.57 + - - - 2368 + - 5056 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 5056 + - - 0 + - 2383.21 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1024 + - - 4 + - 2242.02 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 128 + - - 19 + - 1111.51 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 2944 + - - 10 + - 3834.15 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 128 + - - 7 + - 3193.63 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 6784 + - - 10 + - 4178.48 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 128 + - - 7 + - 2794.79 + - 
- - 1408 + - 4288 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 4288 + - - 1 + - 2123.08 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 128 + - 256 + - - 7 + - 306.601 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 15 + - 1296.54 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 448 + - - 18 + - 3357.61 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 2368 + - - 18 + - 4116.64 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 64 + - 2368 + - - 7 + - 1372.55 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 128 + - - 16 + - 761.11 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 6784 + - - 17 + - 4193.89 + - - - 2944 + - 6784 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 6784 + - - 0 + - 2565.87 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 704 + - 704 + - - 7 + - 1574.95 + - - - 5888 + - 4288 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 4288 + - - 0 + - 2655.04 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 6784 + - - 10 + - 4339.4 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 2368 + - - 18 + - 4127.46 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 64 + - - 7 + - 691.107 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2368 + - - 7 + - 1907.44 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 64 + - - 28 + - 10.779 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 4288 + - - 18 + - 3960.64 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 4288 + - - 9 + - 2403.45 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 64 + - 704 + - - 15 + - 277.268 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 2368 + - - 18 + - 3444.06 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 64 + - - 4 + - 2416.76 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 128 + - - 9 + - 2229.35 + - - - 1024 + - 4288 + - 1 + - 3328 + - 
1024 + - 1024 + - 1024 + - 4288 + - - 18 + - 4119.95 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 448 + - 3584 + - - 7 + - 3376.58 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 5056 + - - 18 + - 4105.8 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1408 + - - 9 + - 2152.55 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 4 + - - 28 + - 46.2985 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1856 + - - 4 + - 3310.09 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 704 + - - 18 + - 4066.38 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 448 + - - 4 + - 3161.54 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1024 + - - 28 + - 133.853 + - - - 5056 + - 6784 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 6784 + - - 0 + - 2650.05 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1408 + - - 18 + - 4011.33 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 64 + - - 14 + - 267.105 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 448 + - 5056 + - - 18 + - 3308.21 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 448 + - - 7 + - 3300.01 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 128 + - 4288 + - - 4 + - 2374.54 + - - - 64 + - 1856 + - 1 + - 128 + - 64 + - 64 + - 64 + - 1856 + - - 3 + - 200.903 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 448 + - 704 + - - 15 + - 1617.39 + - - - 1024 + - 704 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 704 + - - 1 + - 863.348 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 2368 + - - 18 + - 3858.51 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 448 + - - 4 + - 3970.16 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 18 + - 2595.94 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 3584 + - - 17 + - 4197.7 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - 
- 18 + - 2575.32 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 448 + - 2944 + - - 18 + - 3018.97 + - - - 704 + - 4 + - 1 + - 128 + - 704 + - 704 + - 704 + - 4 + - - 25 + - 6.73489 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 6784 + - - 10 + - 4438.7 + - - - 3584 + - 64 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 64 + - - 3 + - 356.659 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1856 + - - 18 + - 3839.48 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 128 + - - 7 + - 2082.79 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 448 + - - 18 + - 3786.05 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 3584 + - - 27 + - 230.861 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 448 + - 2368 + - - 7 + - 3014.0 + - - - 448 + - 128 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 3 + - 96.0737 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 64 + - 5888 + - - 7 + - 1838.2 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 5056 + - - 27 + - 281.204 + - - - 5888 + - 4 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 4 + - - 25 + - 53.3006 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 3584 + - - 20 + - 3925.59 + - - - 6784 + - 1856 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 1856 + - - 0 + - 2488.06 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 5056 + - - 4 + - 3864.28 + - - - 2368 + - 1408 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 1408 + - - 1 + - 1847.81 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 2944 + - - 18 + - 3837.0 + - - - 4 + - 5888 + - 1 + - 128 + - 4 + - 4 + - 4 + - 5888 + - - 25 + - 53.3006 + - - - 3584 + - 704 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 704 + - - 0 + - 1617.39 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 64 + - 6784 + - - 7 + - 2121.17 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 6784 + - - 10 + - 4184.16 + - - - 6784 + - 5888 + - 1 + - 1792 + - 
6784 + - 6784 + - 6784 + - 5888 + - - 17 + - 4400.03 + - - - 5056 + - 1856 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 1856 + - - 0 + - 2343.06 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 5056 + - - 10 + - 4207.39 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 4288 + - - 10 + - 4239.34 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 2368 + - - 18 + - 4166.18 + - - - 5056 + - 704 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 704 + - - 0 + - 1811.41 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 448 + - - 7 + - 2158.31 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 448 + - 6784 + - - 18 + - 3373.41 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 5888 + - - 4 + - 3950.3 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 4 + - - 28 + - 21.0051 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 3262.14 + - - - 704 + - 2944 + - 1 + - 128 + - 704 + - 704 + - 704 + - 2944 + - - 1 + - 1424.45 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 4 + - - 28 + - 104.639 + - - - 6784 + - 448 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 448 + - - 1 + - 1754.25 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1856 + - - 20 + - 4114.19 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 2368 + - - 17 + - 3927.57 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 2368 + - - 18 + - 4063.18 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 6784 + - - 20 + - 3960.15 +- null diff --git a/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml new file mode 100644 index 000000000..745f43300 --- /dev/null +++ b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml @@ -0,0 +1,18412 @@ +- MinimumRequiredVersion: 4.12.0 +- 
aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + 
GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 64 + LSCB: 8 + LSPA: 4 + LSPB: 32 + LVCA: 16 + LVCB: 2 + LVPA: 1 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 1024 + LdsOffsetA: 0 + LdsOffsetB: 512 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: 
GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x8_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + 
- 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 16 + LSPA: 8 + LSPB: 16 + LVCA: 8 + LVCB: 4 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + 
NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x32x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + 
GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 8 + LSPA: 8 + LSPB: 32 + LVCA: 8 + LVCB: 2 + LVPA: 2 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 1792 + LdsNumElementsAlignedA: 256 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 256 + LdsOffsetB_Blk: 1280 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + 
IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x64x8_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + 
GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + 
NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x128x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + 
GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 64 + LSCB: 8 + LSPA: 4 + LSPB: 32 + LVCA: 16 + LVCB: 2 + LVPA: 1 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 1792 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 256 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + 
IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x8_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 8 
+ GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + 
IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU8_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + 
GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 
+ - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + 
GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 
+ - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x64x32_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + 
GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 8 + LSPA: 2 + LSPB: 32 + LVCA: 128 + LVCB: 8 + LVPA: 2 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + 
Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 8 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + 
GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 8 + LSPA: 4 + LSPB: 32 + LVCA: 64 + LVCB: 8 + LVPA: 4 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + 
DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 9 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + 
FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: 
false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 10 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + 
DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 8 + LSPA: 8 + LSPB: 32 + LVCA: 32 + LVCB: 8 + LVPA: 8 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 256 + LdsNumElementsAlignedB: 256 + LdsOffsetA: 0 + LdsOffsetA_Blk: 512 + LdsOffsetB: 256 + LdsOffsetB_Blk: 768 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + 
AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 11 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x32x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + 
DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 
0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 12 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x128x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + 
CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 4 + LSPB: 16 + LVCA: 64 + LVCB: 16 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 
+ PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 13 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x16_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + 
BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 8 + LSPA: 8 + LSPB: 64 + LVCA: 32 + LVCB: 4 + LVPA: 2 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + 
- 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 14 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x64x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + 
AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + 
PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 15 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + 
AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 8 + LSPA: 8 + LSPB: 32 + LVCA: 32 + LVCB: 8 + LVPA: 8 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 256 + LdsNumElementsAlignedB: 256 + LdsOffsetA: 0 + LdsOffsetA_Blk: 512 + LdsOffsetB: 256 + LdsOffsetB_Blk: 768 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + 
OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 16 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x32x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - 
AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + 
NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 17 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 
+ WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 8 + LSPA: 8 + LSPB: 128 + LVCA: 32 + LVCB: 2 + LVPA: 2 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + 
NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 18 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x128x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + 
VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 8 + LSPA: 4 + LSPB: 32 + LVCA: 64 + LVCB: 8 + LVPA: 4 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + 
NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 19 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + 
ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 2 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 4 + LSPA: 4 + LSPB: 16 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + 
MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 20 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT16x16x4_SE_AMAS2_GRVW2_GSU1_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + 
ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 4 + LSPA: 4 + LSPB: 16 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + 
MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 21 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT16x16x4_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: 
false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + 
MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 22 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + 
SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + 
MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 23 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU4_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + 
SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + 
MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 24 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU8_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + 
SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 
8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 25 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + 
StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + 
LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 26 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 
+ StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 39.3642 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4148.36 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4141.24 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4378.86 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 6 + - 2352.57 + - - - 256 + - 1856 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 566.059 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 6 + - 3523.35 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 3995.42 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4359.77 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4346.04 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 3978.89 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 3629.13 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3966.27 + - - - 448 + - 256 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 165.764 + - - - 4 + - 2944 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 27.2674 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 23 + - 99.9254 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 
3976.72 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 3528.86 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 39.961 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 24 + - 93.5274 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 1106.68 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4171.94 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 3639.65 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1297.17 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 2622.29 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 65.341 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 6 + - 3218.49 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 18 + - 3755.41 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 495.056 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4461.2 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 14 + - 3094.35 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 4145.09 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3864.15 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 5 + - 249.844 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 16 + - 1329.78 + - - - 3584 + - 4 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 20 + - 32.3523 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 2345.97 + - - - 5888 + - 448 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 1423.93 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4439.33 + - - - 6784 + - 2368 + - 1 + - 128 + - 
6784 + - 6784 + - 6784 + - 128 + - - 4 + - 2220.39 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 3947.86 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 24.7172 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 2112.24 + - - - 1408 + - 1024 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1158.65 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 3849.86 + - - - 256 + - 6784 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 4 + - 1291.23 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 14 + - 3495.93 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 26 + - 101.342 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 6 + - 1271.77 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 3546.14 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3935.55 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 3944.24 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4127.22 + - - - 704 + - 128 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 132.884 + - - - 5056 + - 4 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 20 + - 45.1937 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 2893.12 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4278.74 + - - - 3584 + - 1024 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 0 + - 1605.26 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 23 + - 60.3621 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4178.75 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4276.36 + - - - 4288 + - 1024 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + 
- 128 + - - 3 + - 1766.53 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 21.3472 + - - - 128 + - 448 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 84.6406 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4300.5 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4416.4 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 65.5694 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 19 + - 2812.03 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 22 + - 158.641 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4160.45 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 6 + - 3209.78 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 18 + - 3848.87 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3625.97 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 73.0438 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 3278.28 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4292.92 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 2943.86 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 3706.58 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 12 + - 3301.71 + - - - 1024 + - 3584 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 0 + - 1616.3 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 1495.38 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 3830.45 + - - - 4288 + - 6784 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2429.72 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 6 + - 1553.95 + - - - 
1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 1775.29 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 26 + - 9.55733 + - - - 6784 + - 4288 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 0 + - 2377.59 + - - - 1856 + - 128 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 1 + - 346.183 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 135.234 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4349.99 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 25 + - 151.063 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 3.21886 + - - - 128 + - 5056 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 704.401 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2829.71 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 3600.97 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 5 + - 408.618 + - - - 256 + - 704 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 258.154 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 18 + - 4157.3 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 23 + - 138.875 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4203.55 + - - - 704 + - 2944 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 1300.95 + - - - 1408 + - 4288 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1839.3 + - - - 448 + - 6784 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 0 + - 1549.64 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 0.0975238 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 13 + - 271.652 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4388.28 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 97.8807 + 
- - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4382.68 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 3797.64 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 3968.1 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 14 + - 3953.56 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 23 + - 114.655 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 6 + - 1781.3 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4428.42 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 6 + - 3798.7 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 14 + - 4183.52 + - - - 704 + - 4 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 20 + - 6.61621 + - - - 64 + - 64 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 2 + - 4.36035 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 80.2595 + - - - 1856 + - 704 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 4 + - 1114.99 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 3858.52 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 13 + - 732.876 + - - - 128 + - 128 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 26.5866 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 6 + - 2114.45 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 3203.57 + - - - 1408 + - 64 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 135.634 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 3906.42 + - - - 5888 + - 128 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 1 + - 889.935 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 3342.88 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 
6784 + - 6784 + - 768 + - - 14 + - 4165.82 + - - - 5056 + - 1024 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 3 + - 1808.68 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 13 + - 450.388 + - - - 6784 + - 5888 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 0 + - 2462.27 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4447.72 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 563.751 + - - - 3584 + - 6784 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 0 + - 2150.84 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4496.73 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 3243.21 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 23 + - 210.041 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 18 + - 3774.26 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 3927.19 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 26 + - 181.189 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 4209.42 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 10 + - 3117.73 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 23 + - 157.418 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 16 + - 140.184 + - - - 128 + - 4288 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 578.894 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3493.17 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4340.86 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 26 + - 4.38075 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 10 + - 3334.59 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 
+ - 1792 + - - 6 + - 3135.25 + - - - 3584 + - 5056 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 0 + - 2084.49 + - - - 4288 + - 128 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 1 + - 655.849 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3755.13 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 516.771 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 2670.14 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 16 + - 1180.07 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4437.93 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 10 + - 3173.32 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3263.61 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 1769.85 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 202.038 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 6 + - 2413.33 + - - - 64 + - 448 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 41.9718 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 3835.24 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 13 + - 495.948 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 3972.23 + - - - 448 + - 1024 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 620.984 + - - - 4 + - 2368 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 21.9961 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 2690.8 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 3930.42 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 23 + - 248.798 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 18 + - 3950.24 + - - - 4288 + - 
1024 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 3832.07 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 10 + - 2942.24 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 4047.77 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 10 + - 3152.45 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 6 + - 3149.26 + - - - 1856 + - 5888 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 4 + - 2094.77 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 105.703 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 71.2817 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 3975.85 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 8 + - 2131.59 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 24 + - 7.86612 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4294.26 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 13 + - 961.688 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4222.89 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 3188.17 + - - - 4 + - 4288 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 39.487 + - - - 5888 + - 3584 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 2215.93 + - - - 2944 + - 1856 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 1801.47 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 10 + - 3608.14 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 3600.47 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 10 + - 3588.68 + - - - 2944 + - 5888 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2232.72 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 
2368 + - 2368 + - 1792 + - - 6 + - 3020.64 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 13 + - 393.292 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 23 + - 173.349 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 9 + - 1733.22 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 15 + - 1336.9 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 6 + - 2914.61 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 2076.84 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 2823.23 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4322.48 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 10 + - 2184.53 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 2915.69 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 10 + - 2959.69 + - - - 4288 + - 4288 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 2273.68 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4245.39 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 10.6603 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 2470.53 + - - - 64 + - 704 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 68.0091 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 2846.6 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4304.64 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 3915.62 + - - - 64 + - 1856 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 173.249 + - - - 1024 + - 2368 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1325.5 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 90.7877 + - 
- - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 6 + - 3329.39 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 6 + - 2678.84 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 3695.81 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 2688.39 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4392.89 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 6 + - 1744.98 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 17 + - 2494.4 + - - - 2368 + - 5056 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 2146.35 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4221.01 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 3916.54 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 976.068 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4392.5 + - - - 2368 + - 5888 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 2196.37 + - - - 448 + - 5888 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 3 + - 1587.85 + - - - 5888 + - 5056 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 0 + - 2304.61 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 3644.58 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 10 + - 3128.24 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 6 + - 1993.93 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 14 + - 3564.64 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 201.514 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 17.9797 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 3717.36 + - - - 2944 + - 
1856 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4171.27 + - - - 4 + - 3584 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 32.9566 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 3919.12 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 2831.87 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4244.99 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4410.19 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 10 + - 3108.37 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 2749.61 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 1240.16 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 1864.53 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 2205.8 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 3329.61 + - - - 1408 + - 3584 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1709.88 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 6 + - 2436.09 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4242.39 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4521.32 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 3915.63 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4461.97 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 2469.07 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 16 + - 998.273 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 11 + - 276.205 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 2617.02 + - - - 448 + - 704 + - 1 + - 256 + - 
448 + - 448 + - 448 + - 256 + - - 6 + - 1499.64 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 4060.31 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 657.709 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 15.0542 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 6 + - 2840.92 + - - - 6784 + - 64 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 1 + - 530.696 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 10 + - 3206.42 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4440.8 + - - - 3584 + - 448 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1272.42 + - - - 2944 + - 64 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 1 + - 266.077 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4151.19 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 2438.61 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 14 + - 3926.02 + - - - 128 + - 1024 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 192.223 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4295.68 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 10 + - 2676.72 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3552.7 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4144.37 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 4.25927 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4226.4 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 25 + - 50.5815 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 6 + - 3583.98 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 
14 + - 3932.54 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 3876.18 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 3975.39 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 22 + - 201.474 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4303.81 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 18 + - 3948.45 + - - - 2944 + - 1408 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 1626.35 + - - - 128 + - 1856 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 340.905 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 561.737 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3415.51 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 10 + - 2575.28 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 2747.73 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 6 + - 3696.24 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 3530.4 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4233.41 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 6 + - 1706.87 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 2627.96 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 3763.53 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 14 + - 3897.5 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 6 + - 1855.11 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4059.38 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 10 + - 3584.42 + - - - 4288 + - 1856 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + 
- 1994.62 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 12 + - 3890.5 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4239.18 + - - - 1024 + - 64 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 1 + - 98.4578 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 3142.6 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 2056.9 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4506.24 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4184.67 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 11 + - 970.904 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 91.476 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3846.05 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 18 + - 3941.4 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 3595.46 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 2291.53 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4238.22 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 3586.47 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4354.21 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4417.73 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 6 + - 2720.28 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 6 + - 3541.9 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 6 + - 3540.4 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 14 + - 3855.64 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 6 + - 
3623.32 + - - - 704 + - 1856 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 1113.8 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4235.17 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 17 + - 2476.9 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 2180.82 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 5 + - 418.915 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4489.82 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 3072.11 + - - - 2944 + - 128 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 1 + - 529.817 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 7.81431 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 13 + - 608.718 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 18 + - 4044.3 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 6 + - 3246.72 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4082.81 + - - - 64 + - 256 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 25.1578 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 5 + - 159.566 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 392.725 + - - - 1024 + - 1856 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1374.72 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 3578.29 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 23 + - 167.084 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 12 + - 3782.92 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 2953.84 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 11 + - 1221.3 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 
1856 + - 768 + - - 24 + - 85.7646 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 14 + - 3822.29 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 14 + - 4035.35 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3622.28 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 105.703 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4212.77 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 4118.16 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4303.36 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 15 + - 1379.2 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 10 + - 2825.13 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 6 + - 3716.14 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 10 + - 2978.52 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 521.444 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 22 + - 66.9038 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 7 + - 2534.09 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 23 + - 69.0395 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 2226.06 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 10 + - 2539.8 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3202.47 + - - - 5056 + - 448 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 1 + - 1353.3 + - - - 1024 + - 5888 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1719.9 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 6 + - 1010.03 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 10 
+ - 3609.36 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 12 + - 3814.24 + - - - 256 + - 4288 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 888.849 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4379.88 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 3514.27 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 79.771 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 5 + - 76.9503 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 92.4762 + - - - 128 + - 2368 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 420.978 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1999.08 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 45.9277 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 5 + - 94.588 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 3517.46 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4316.26 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4312.31 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4191.83 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 6 + - 3782.12 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 2849.78 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 3779.48 + - - - 4288 + - 5888 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2406.56 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4211.53 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 3569.22 + - - - 448 + - 1408 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 746.49 + - - - 6784 + - 1024 + - 1 + - 128 + - 6784 + - 
6784 + - 6784 + - 128 + - - 4 + - 1923.0 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 8 + - 2457.45 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3654.89 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 3772.87 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 2880.86 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4418.24 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 6 + - 1439.07 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4417.68 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 3951.13 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 16 + - 138.578 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 17 + - 2014.94 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 25 + - 25.2062 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 3597.68 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 3504.14 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 23 + - 41.3512 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 1284.63 + - - - 704 + - 5888 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 4 + - 1659.31 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 3887.89 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 81.5378 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 6 + - 3208.12 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4347.12 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4512.11 + - - - 448 + - 2368 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + 
- - 1 + - 939.337 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 11 + - 379.919 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 775.852 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 16 + - 1058.47 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 3465.95 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 9.24903 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 492.84 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 6 + - 2224.25 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4385.55 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 16 + - 37.8092 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 10 + - 2250.46 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 10 + - 3429.53 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 13 + - 916.095 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 4265.58 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4450.36 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 14 + - 3615.24 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 3868.07 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 246.862 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3836.6 + - - - 5056 + - 1408 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 4 + - 1943.71 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 24 + - 21.0466 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4084.72 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4518.51 + - - - 128 + - 6784 + 
- 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 3336.42 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 9 + - 1613.47 + - - - 1856 + - 1856 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 0 + - 1728.31 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 3295.03 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4397.48 + - - - 2944 + - 6784 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2257.53 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 3641.76 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4233.8 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 4194.07 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 11 + - 989.223 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 3771.56 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 1509.73 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4343.82 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 8 + - 2418.79 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 2832.56 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 6 + - 3533.44 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4380.48 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 777.945 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 14 + - 3929.17 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 6 + - 725.658 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3370.57 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 3903.04 + - - - 2368 + - 
4288 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 2041.26 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4414.07 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3757.27 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 3982.92 + - - - 2944 + - 448 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 1 + - 1108.91 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 15 + - 1124.25 + - - - 448 + - 704 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 443.433 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 25 + - 3.30323 + - - - 1408 + - 6784 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 2013.04 + - - - 256 + - 5888 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 4 + - 1154.49 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 3292.65 + - - - 256 + - 3584 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 958.229 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 3416.79 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 6 + - 3384.32 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 3973.34 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 6 + - 1933.44 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 2332.89 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4230.03 + - - - 5888 + - 2368 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 2132.33 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 6 + - 2615.92 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 14 + - 3438.0 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4243.46 + - - - 4288 + - 4 + - 1 + - 3328 + 
- 4288 + - 4288 + - 4288 + - 3328 + - - 23 + - 302.085 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 6 + - 1522.25 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 121.538 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 3345.79 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 18 + - 3273.88 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 25 + - 307.163 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 3218.49 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 3510.95 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4268.16 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 13 + - 1152.42 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 26 + - 47.7204 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 23 + - 214.8 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 4060.66 + - - - 128 + - 2944 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 525.659 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 3013.8 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 15 + - 1432.97 + - - - 704 + - 1408 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 923.687 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 2731.29 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 3120.22 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4366.64 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 10 + - 2368.66 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4352.55 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 
1004.69 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 6 + - 3286.94 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 25 + - 1.76172 + - - - 64 + - 1024 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 99.297 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 3319.88 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 24 + - 116.381 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 273.585 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 10 + - 2666.68 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 10 + - 2224.84 + - - - 1024 + - 448 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 1 + - 601.149 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 10 + - 3212.27 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 2181.4 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 1299.12 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 1908.98 + - - - 4288 + - 4 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 20 + - 38.7619 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 14 + - 3832.99 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 15 + - 1038.99 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 6 + - 2190.88 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 3432.84 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 3870.09 + - - - 2944 + - 2368 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 1884.48 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 3727.33 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4358.94 + - - - 64 + - 4 + - 1 + - 3328 
+ - 64 + - 64 + - 64 + - 3328 + - - 24 + - 10.9677 + - - - 5888 + - 704 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 1604.32 + - - - 448 + - 64 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 43.197 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 3534.46 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 6 + - 3293.39 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 10 + - 3103.89 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 23 + - 32.9956 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 2820.58 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4446.3 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 11 + - 344.926 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 11 + - 1547.79 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 6 + - 2000.91 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 3351.24 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4178.59 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3545.33 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4141.26 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4259.14 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 984.158 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 2913.52 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4297.31 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4477.42 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 67.2809 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 
6784 + - 768 + - - 6 + - 3337.14 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 10 + - 3144.55 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 10 + - 3098.55 + - - - 1024 + - 6784 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1787.25 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4349.64 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 10 + - 3313.18 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 10 + - 3425.19 + - - - 4288 + - 5056 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2329.32 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 9 + - 1266.43 + - - - 1856 + - 1408 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 1568.34 + - - - 256 + - 5056 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 4 + - 996.122 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 26 + - 202.288 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 6 + - 2826.71 + - - - 128 + - 4 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 20 + - 1.23189 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 14 + - 3633.59 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4358.39 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 18 + - 3731.07 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4024.81 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4372.03 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4060.18 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 10 + - 2647.14 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 18 + - 3947.28 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 
3584 + - 3584 + - 1792 + - - 14 + - 4492.65 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 18 + - 3960.85 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4383.11 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 6 + - 2070.53 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 6 + - 3467.13 + - - - 4288 + - 2944 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 2180.76 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 4086.64 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 564.256 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3691.13 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 3987.26 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 9 + - 2531.63 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 3372.86 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 3945.45 + - - - 2944 + - 3584 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2092.22 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 1460.74 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 6 + - 1849.25 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 282.889 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4195.95 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 16 + - 814.654 + - - - 5888 + - 6784 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 0 + - 2353.9 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 2552.92 + - - - 64 + - 128 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 12.1814 + - - - 1856 + - 64 + - 1 + - 128 + - 1856 + - 1856 + - 1856 
+ - 128 + - - 1 + - 168.637 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 979.146 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 4112.19 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 8 + - 3172.45 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 6 + - 1523.51 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 10 + - 2662.93 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 6 + - 1486.98 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 1708.47 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 22 + - 332.409 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 4138.04 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 2614.24 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 2441.02 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 4056.55 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 8 + - 3024.66 + - - - 4288 + - 448 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 1515.6 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 3160.85 + - - - 4 + - 5056 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 46.6264 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 12 + - 3921.5 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4348.85 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 3309.52 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4235.52 + - - - 128 + - 3584 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 539.708 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 24 + - 183.04 
+ - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 3464.05 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 26 + - 48.6052 + - - - 5888 + - 2944 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 2187.64 + - - - 704 + - 4288 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 0 + - 1607.32 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 1706.16 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 22 + - 281.542 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 2316.59 + - - - 2944 + - 5056 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2208.65 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4499.82 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3518.86 + - - - 1408 + - 5056 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1909.5 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 1775.3 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4379.72 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4407.8 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 12 + - 4012.21 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 3513.99 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3831.94 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 10 + - 3301.36 + - - - 704 + - 1024 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 848.113 + - - - 2944 + - 704 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 1 + - 1280.36 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 1559.3 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 10 + - 3462.9 + - - - 4 + - 256 + - 1 + 
- 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 5.68889 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 10 + - 3289.3 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4329.8 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 12 + - 3275.05 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4383.11 + - - - 256 + - 2368 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 664.793 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 4146.56 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4314.91 + - - - 4288 + - 2368 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 3 + - 2044.34 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4227.47 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4017.22 + - - - 5056 + - 3584 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 4 + - 2242.14 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4308.74 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 2379.99 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4227.82 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 3798.69 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 0.668277 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 3510.93 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 6 + - 3448.82 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 6 + - 2370.69 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 24 + - 155.855 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 6 + - 2857.03 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 
256 + - 256 + - 768 + - - 10 + - 2655.11 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 2818.45 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4213.1 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 83.6475 + - - - 6784 + - 128 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 1 + - 1004.6 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 2831.61 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4297.78 + - - - 1024 + - 1408 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1159.23 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 23 + - 185.328 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4432.48 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 386.928 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4289.42 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 24 + - 99.6136 + - - - 4 + - 448 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 3.9385 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4357.62 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4357.97 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 24.487 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 10 + - 3368.68 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 3911.17 + - - - 4288 + - 704 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 1564.63 + - - - 2368 + - 2944 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 1937.85 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 6 + - 668.03 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 18 + - 4099.15 + - 
- - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 26 + - 13.8209 + - - - 64 + - 4 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 20 + - 0.605028 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4208.25 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 10 + - 3571.36 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 10 + - 3114.19 + - - - 5888 + - 256 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 1215.59 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 6 + - 3113.73 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 10 + - 2792.9 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 3333.13 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 10 + - 2753.42 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4383.9 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 153.553 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 205.201 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 10 + - 2245.55 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 3384.11 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4458.04 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4394.43 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 14 + - 3195.11 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 12 + - 4090.84 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 2964.02 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 774.463 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4395.23 + - - - 2368 + - 4288 + - 1 + - 256 + 
- 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 3946.17 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4313.43 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 66.8912 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4439.79 + - - - 2944 + - 256 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 1 + - 873.813 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 10 + - 2834.46 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 5 + - 168.969 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 178.305 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 3954.41 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 6 + - 3263.15 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 2851.29 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 13 + - 1168.22 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 3669.02 + - - - 448 + - 3584 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 4 + - 1312.06 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 3304.19 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 3435.51 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 4133.74 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 6 + - 1745.1 + - - - 3584 + - 2368 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1889.39 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4354.77 + - - - 448 + - 4 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 20 + - 4.29226 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 10 + - 3408.71 + - - - 5056 + - 5056 + - 1 + - 128 + - 5056 + - 5056 + - 
5056 + - 128 + - - 0 + - 2404.96 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 26 + - 70.9441 + - - - 4 + - 1408 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 12.1774 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 14 + - 3925.26 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 2570.26 + - - - 5888 + - 1856 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 2049.11 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4390.38 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 6 + - 2155.66 + - - - 4 + - 4 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 21 + - 0.0286676 + - - - 2944 + - 4288 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2134.89 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 3803.64 + - - - 1024 + - 1024 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 866.144 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 3725.14 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4372.9 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 13 + - 260.47 + - - - 5888 + - 4288 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 2264.76 + - - - 64 + - 6784 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 585.735 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 3992.08 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4478.82 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 6 + - 1015.04 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 18 + - 3701.94 + - - - 256 + - 256 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 95.8479 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3589.75 + - - - 
128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 51.3002 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4544.89 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1747.63 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 27.9046 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 31.9312 + - - - 6784 + - 3584 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 2316.02 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 17 + - 2145.24 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 24 + - 28.672 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 3364.63 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4476.55 + - - - 4 + - 128 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 1.17197 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4269.62 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 2314.09 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 14 + - 4220.95 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 26 + - 183.585 + - - - 704 + - 448 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 453.801 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 3807.34 + - - - 2368 + - 4 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 20 + - 21.4361 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3895.64 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4287.55 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 6 + - 1927.9 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4029.73 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 
2944 + - 3328 + - - 6 + - 3801.8 + - - - 6784 + - 1856 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 2147.51 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 2959.69 + - - - 128 + - 1408 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 260.722 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4279.73 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 3520.08 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4034.92 + - - - 3584 + - 1408 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1650.46 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 10 + - 3602.35 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 1765.2 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3762.52 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 13 + - 485.773 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 19.9805 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4093.62 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 139.81 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 26 + - 25.0047 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 10 + - 2779.78 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 3147.42 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4448.59 + - - - 4 + - 5888 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 53.8336 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4298.85 + - - - 6784 + - 2944 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 2288.9 + - - - 4288 + - 64 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 1 + - 374.013 + - - - 128 
+ - 448 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 354.249 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 6 + - 1932.76 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 5 + - 82.957 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 6 + - 2049.21 + - - - 704 + - 256 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 255.864 + - - - 4 + - 6784 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 62.3822 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4453.78 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 11 + - 1083.06 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4460.72 + - - - 6784 + - 5056 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 0 + - 2412.2 + - - - 128 + - 256 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 50.607 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 3608.74 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 10 + - 2333.17 + - - - 4 + - 704 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 6.29279 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3919.53 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 2805.59 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3345.29 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 3891.09 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 3841.0 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3679.21 + - - - 4 + - 1856 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 17.1407 + - - - 5056 + - 64 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 1 + - 450.204 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 
768 + - - 14 + - 4414.96 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 3354.1 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4308.95 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 6 + - 2213.15 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 23 + - 197.314 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 3458.02 + - - - 1856 + - 6784 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 2166.45 + - - - 1408 + - 1408 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 1265.74 + - - - 3584 + - 2944 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1982.16 + - - - 1856 + - 448 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 1 + - 964.743 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 278.137 + - - - 1408 + - 1856 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 3 + - 1469.15 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 101.606 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 26 + - 68.2667 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 10 + - 3113.41 + - - - 128 + - 5888 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 793.331 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 6 + - 2241.21 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 24 + - 7.96629 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2855.9 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 6 + - 646.13 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4456.48 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4314.93 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 5 + - 254.889 + - - - 6784 + - 256 
+ - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 1367.48 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 14 + - 4163.56 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 3653.53 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 23 + - 277.644 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 3905.3 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 1652.45 + - - - 1024 + - 2944 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 0 + - 1452.41 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 3824.23 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1529.5 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 4256.23 + - - - 256 + - 128 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 49.9322 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 23 + - 257.251 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 18 + - 3784.77 + - - - 448 + - 5056 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 3 + - 1384.85 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 1771.4 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4354.88 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 26 + - 0.258586 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4149.36 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4395.04 + - - - 4288 + - 256 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 1 + - 980.662 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 8 + - 2825.48 + - - - 1856 + - 2368 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 1764.62 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 
5056 + - 5056 + - 256 + - - 25 + - 78.2549 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 4169.52 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4196.45 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 3941.37 + - - - 2368 + - 1408 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 0 + - 1673.87 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 6 + - 511.274 + - - - 3584 + - 128 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 1 + - 617.328 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 24 + - 46.8935 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 1972.32 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 18 + - 4166.15 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 10 + - 2258.17 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4055.05 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 976.068 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 18 + - 3907.96 + - - - 64 + - 1408 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 136.018 + - - - 3584 + - 1856 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1802.99 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 656.492 + - - - 2368 + - 1024 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 1 + - 1443.35 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1011.63 + - - - 5056 + - 1856 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 3 + - 2068.94 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3057.03 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 1988.12 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 
+ - 1958.09 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 3729.29 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 12 + - 2827.75 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 1698.61 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 3081.05 + - - - 1024 + - 256 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 1 + - 368.568 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 2212.84 + - - - 5056 + - 256 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 1 + - 1105.09 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4307.17 + - - - 1024 + - 704 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 1 + - 809.427 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4089.26 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 3964.03 + - - - 5888 + - 1408 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 1889.8 + - - - 4 + - 1024 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 9.08968 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 1497.47 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 2887.39 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4313.99 + - - - 128 + - 6784 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 888.908 + - - - 1024 + - 4288 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1607.29 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4430.95 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4252.68 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4440.61 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 0.483019 + - - - 4 + - 704 + 
- 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 13.5303 + - - - 3584 + - 256 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 1 + - 987.227 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4301.25 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3912.25 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 14.2824 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 16 + - 1083.47 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 6 + - 2802.5 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 1832.62 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4445.82 + - - - 3584 + - 704 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1380.18 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 3960.92 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 3928.11 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 24 + - 40.6862 + - - - 2944 + - 2944 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2020.32 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 3316.93 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 10 + - 2537.65 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 4173.27 + - - - 128 + - 704 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 135.38 + - - - 2368 + - 6784 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 2227.32 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 1932.76 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4441.69 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1176.29 + - - - 2368 + - 2368 + - 1 + - 128 + - 2368 + - 2368 
+ - 2368 + - 128 + - - 3 + - 1908.91 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4281.09 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 2028.1 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 14 + - 3775.18 + - - - 448 + - 128 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 85.1117 + - - - 1408 + - 704 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 911.478 + - - - 2368 + - 1856 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 3 + - 1764.18 + - - - 5888 + - 1024 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 1792.11 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 22 + - 256.1 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 1838.74 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4370.84 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 819.2 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 6 + - 2963.69 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 2056.9 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 13 + - 799.97 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 3430.3 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 26 + - 83.6489 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4444.3 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 15 + - 988.864 + - - - 6784 + - 1408 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 2051.69 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 35.4772 + - - - 448 + - 4288 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 2 + - 1480.56 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4492.91 + - - - 
5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 10 + - 2803.87 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 23 + - 134.269 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 3721.65 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 18 + - 3981.68 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 10 + - 3129.06 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 1106.68 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 18 + - 4021.73 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4307.56 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 2626.56 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 9 + - 2005.7 + - - - 1408 + - 448 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 728.704 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 13 + - 678.473 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 3732.64 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4035.28 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 10 + - 3034.65 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 3625.11 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 24 + - 122.613 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2306.69 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 10 + - 3392.45 + - - - 5888 + - 64 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 1 + - 519.768 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 14 + - 2709.8 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4325.34 + - - - 4288 + - 128 + 
- 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 6 + - 2427.83 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 1490.22 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4534.05 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 17 + - 2087.38 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 25 + - 88.9804 + - - - 3584 + - 5888 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 0 + - 2139.28 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4150.99 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 6 + - 3352.28 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 1266.23 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 3931.0 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 2301.23 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4183.12 + - - - 5056 + - 2944 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 4 + - 2225.15 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 24 + - 18.6447 + - - - 256 + - 64 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 26.7494 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4295.19 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 14 + - 3312.0 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 7 + - 2780.79 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 2825.6 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3471.1 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 10 + - 2493.68 + - - - 1024 + - 128 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 1 + - 186.912 + - - - 5888 + - 5888 + - 1 + - 256 + - 
5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4312.34 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 728.178 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 26 + - 15.3121 + - - - 64 + - 4288 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 388.233 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 16 + - 753.597 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4163.76 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4480.35 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 6 + - 2108.9 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4219.49 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 3246.18 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4540.43 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4088.55 + - - - 3584 + - 64 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 1 + - 319.967 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4199.65 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 10 + - 2869.86 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 8 + - 2569.23 + - - - 5056 + - 5888 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2436.65 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 14 + - 3172.63 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 13 + - 433.369 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 24 + - 14.8176 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 23 + - 239.083 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4220.07 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + 
- 3328 + - - 14 + - 4165.0 + - - - 3584 + - 3584 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 2017.09 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4106.91 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 24 + - 103.448 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4209.47 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 8 + - 2297.52 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4173.01 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 6 + - 3598.39 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 8 + - 2802.21 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 9 + - 2058.01 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 3766.7 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 2342.79 + - - - 2944 + - 4 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 20 + - 26.8019 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 1499.26 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 3399.41 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3105.04 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 1900.95 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 13 + - 267.105 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 23 + - 191.447 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 4178.89 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 9 + - 1808.54 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 10 + - 3175.71 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 
+ - 1299.12 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 24 + - 5.82025 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 4199.28 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 26 + - 60.1415 + - - - 4288 + - 3584 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2240.67 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 3319.92 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 10 + - 2378.29 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 3958.12 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4533.49 + - - - 4 + - 256 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 2.25677 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 3917.77 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 1836.6 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4457.63 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 3073.66 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 3396.29 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 26 + - 69.3016 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 3889.77 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 11 + - 1297.17 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 14 + - 3291.5 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 18 + - 3749.64 + - - - 5056 + - 4288 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2339.69 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 3421.93 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4168.41 + - - - 1856 + - 4 
+ - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 20 + - 16.8251 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 14 + - 3703.02 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4051.52 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4211.71 + - - - 2368 + - 3584 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 2058.06 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 47.943 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 52.6394 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 5 + - 142.948 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4154.15 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4447.42 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 6 + - 2466.98 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 2943.86 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4130.78 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 8 + - 2488.48 + - - - 704 + - 5056 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 0 + - 1731.03 + - - - 256 + - 2944 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 804.982 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4066.5 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 11 + - 521.444 + - - - 2368 + - 448 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 912.571 + - - - 64 + - 3584 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 327.973 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4466.21 + - - - 2368 + - 64 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 1 + - 217.474 + - - - 4288 + - 1408 + - 1 + - 128 + - 4288 + - 4288 + - 
4288 + - 128 + - - 4 + - 1854.49 + - - - 5888 + - 4 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 20 + - 53.1503 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 2861.67 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 1176.29 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 777.246 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4483.23 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 4207.54 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4421.63 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 2912.71 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 2789.1 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 3469.83 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 18 + - 3711.42 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2200.82 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4071.47 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4272.71 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 246.862 + - - - 64 + - 5888 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 523.833 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 7.81253 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 10 + - 2222.79 + - - - 2368 + - 128 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 1 + - 432.619 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 2770.63 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4407.1 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 3801.9 + - 
- - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 3955.03 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 3800.56 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 6 + - 2899.89 + - - - 6784 + - 704 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 1808.64 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 3895.38 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3749.73 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 3850.02 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 3806.86 + - - - 1408 + - 256 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 505.449 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 3583.09 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 11 + - 178.851 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 13 + - 784.191 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3400.28 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 6 + - 1971.41 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 3965.04 + - - - 256 + - 4 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 20 + - 2.47121 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 3393.15 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 9 + - 1602.79 + - - - 1408 + - 2944 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1667.23 + - - - 1024 + - 5056 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1646.22 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 8 + - 2677.23 + - - - 1856 + - 2944 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 1884.97 + - - - 256 + 
- 448 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 169.125 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 3705.11 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 14 + - 3600.94 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 6 + - 1677.14 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 64.9846 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 16 + - 1013.31 + - - - 64 + - 2368 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 218.848 + - - - 1856 + - 4288 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 4 + - 1990.26 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 3422.2 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 3725.08 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 3267.57 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 3824.17 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4148.08 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 13 + - 665.6 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3676.17 + - - - 5056 + - 704 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 1751.25 + - - - 5888 + - 5888 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 0 + - 2312.49 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 10 + - 3128.3 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4134.28 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4507.56 + - - - 256 + - 1408 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 495.036 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 1.64498 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 
+ - - 6 + - 2790.75 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 18 + - 4096.69 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 16 + - 759.445 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 9 + - 1168.26 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 3298.79 + - - - 6784 + - 448 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 0 + - 1497.16 + - - - 1856 + - 1024 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 2 + - 1474.0 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4511.54 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 2968.67 + - - - 448 + - 448 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 295.969 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 3635.77 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2726.43 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 2913.74 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 10 + - 3065.9 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 18 + - 4020.09 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4397.37 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 2915.15 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 11 + - 831.846 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 9 + - 1522.22 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 387.926 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3371.93 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 3852.75 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 
+ - 4404.62 + - - - 1408 + - 2368 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 0 + - 1577.36 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 6 + - 2302.69 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 13 + - 771.012 + - - - 64 + - 5056 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 444.026 + - - - 6784 + - 6784 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 0 + - 2506.43 + - - - 448 + - 1856 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 953.678 + - - - 2944 + - 1024 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 0 + - 1500.76 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4503.58 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 14 + - 3605.13 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 3689.58 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 14 + - 3359.31 + - - - 704 + - 704 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 653.201 + - - - 1408 + - 128 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 257.463 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4280.89 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 98.3595 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4264.67 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3619.73 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 3742.02 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 13 + - 645.303 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4554.14 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 4286.55 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 3949.42 + - 
- - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 6 + - 3040.87 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 8 + - 2484.44 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2436.49 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4556.72 + - - - 448 + - 2944 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 4 + - 1104.27 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 24 + - 135.664 + - - - 128 + - 64 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 13.2262 + - - - 1856 + - 256 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 1 + - 638.302 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 9 + - 1668.76 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 11 + - 1269.08 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 6 + - 3324.54 + - - - 64 + - 2944 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 269.166 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 17 + - 1424.77 + - - - 5056 + - 2368 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 4 + - 2156.26 + - - - 704 + - 6784 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 3 + - 1897.57 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4408.12 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 3113.73 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 3208.42 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 1980.24 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 14 + - 3777.28 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 17 + - 1978.71 + - - - 3584 + - 4288 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 0 + - 2061.81 + - - - 256 + - 448 + - 1 + - 3328 
+ - 256 + - 256 + - 256 + - 3328 + - - 15 + - 1569.93 + - - - 1408 + - 4 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 20 + - 13.0033 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3569.76 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 3289.18 + - - - 5056 + - 6784 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2459.99 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 2080.65 + - - - 1024 + - 4 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 20 + - 9.49806 + - - - 256 + - 1024 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 377.525 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 22 + - 302.117 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 1966.08 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 1724.12 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 56.5662 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 385.85 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 8 + - 2833.99 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4291.71 + - - - 1856 + - 5056 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 4 + - 2068.94 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4183.09 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 10 + - 3156.62 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4256.21 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4363.46 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 24 + - 66.5006 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3583.54 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 128 + - 
768 + - - 10 + - 2659.99 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 14 + - 4152.69 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4389.23 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 6 + - 1981.12 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 6 + - 2786.16 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 24 + - 36.6806 + - - - 6784 + - 4 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 20 + - 61.2383 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 1775.94 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 6 + - 3320.03 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 3808.1 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 6 + - 1224.18 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4433.08 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 14 + - 2913.51 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 6 + - 3431.07 + - - - 4 + - 64 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 21 + - 0.472983 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 3948.3 + - - - 2368 + - 704 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 1356.72 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4348.69 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 9 + - 2017.03 + - - - 704 + - 3584 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 3 + - 1504.1 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 177.467 + - - - 1408 + - 5888 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1931.63 + - - - 1856 + - 3584 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 1990.85 + - - - 4 + 
- 1856 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 211.1 + - - - 704 + - 2368 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 2 + - 1329.01 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4213.24 + - - - 704 + - 64 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 66.3198 + - - - 2368 + - 256 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 1 + - 724.912 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 3940.44 + - - - 5056 + - 128 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 1 + - 767.014 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 26 + - 179.961 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 3107.11 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 24 + - 211.533 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 6 + - 2182.47 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3459.77 +- null diff --git a/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml new file mode 100644 index 000000000..51a99cef5 --- /dev/null +++ b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml @@ -0,0 +1,19013 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + 
IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 64 + LSPA: 16 + LSPB: 4 + LVCA: 4 + LVCB: 16 + LVPA: 4 + LVPB: 1 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + 
MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 4 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 4 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + 
StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 16 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 2048 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + 
MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x128x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 
16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 32 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 32 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 
64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 4 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 4 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x32x32_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + 
SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 2048 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + 
MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x64x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + 
SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 16 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + 
MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x128x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + 
ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 64 + LSPA: 32 + LSPB: 4 + LVCA: 8 + LVCB: 64 + LVPA: 32 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + 
MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + 
SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + 
MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + 
StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 128 + LSPA: 32 + LSPB: 2 + LVCA: 8 + LVCB: 128 + LVPA: 32 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + 
LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + 
SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + 
LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 8 + SolutionNameMin: 
Cijk_Alik_Bjlk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 16 + LSPB: 4 + LVCA: 16 + LVCB: 64 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: 
true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + 
ScheduleLocalWrite: 1 + SolutionIndex: 9 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x64x16_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 128 + LSPA: 32 + LSPB: 2 + LVCA: 8 + LVCB: 128 + LVPA: 32 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: 
true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + 
ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 10 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 8 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + 
LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: 
true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 11 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x64x32_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 
+ LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + 
TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 12 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 
8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + 
Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 13 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 
+ LVPA: 32 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + 
SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 14 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x128x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + 
KernelLanguage: Assembly + LSCA: 8 + LSCB: 64 + LSPA: 32 + LSPB: 4 + LVCA: 8 + LVCB: 64 + LVPA: 32 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 
+ OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 15 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + 
ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 128 + LSPA: 128 + LSPB: 8 + LVCA: 2 + LVCB: 32 + LVPA: 32 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + 
NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 16 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x128x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + 
GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 32 + LSPA: 16 + LSPB: 8 + LVCA: 16 + LVCB: 32 + LVPA: 16 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + 
IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 17 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x32x16_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + 
GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: 
+ - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 18 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + 
GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + 
IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 19 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU8_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + 
GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 64 + LSPA: 32 + LSPB: 4 + LVCA: 8 + LVCB: 64 + LVPA: 32 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: 
+ - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 20 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + 
GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + 
Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 21 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x64x16_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + 
GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 2 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 4 + LSCB: 16 + LSPA: 16 + LSPB: 4 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + 
HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 22 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT16x16x4_SE_AMAS2_GRVW2_GSU1_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + 
GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 4 + LSCB: 16 + LSPA: 16 + LSPB: 4 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + 
ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 23 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT16x16x4_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 
0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + 
ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 24 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true 
+ FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + 
ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 25 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU4_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: 
ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + 
ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 26 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU8_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + 
DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + 
AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 27 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU2_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + 
DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + 
PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 28 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: 
false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + 
PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 29 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 4288 + - - 10 + - 2978.45 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 2944 + - - 14 + - 3351.31 + - - - 448 + - 2944 + - 1 + - 128 + - 448 + - 448 + - 128 + - 2944 + - - 3 + - 1047.28 + - - - 1024 + - 2368 + - 1 + - 
128 + - 1024 + - 1024 + - 128 + - 2368 + - - 4 + - 1270.79 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 2944 + - - 14 + - 4391.66 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 704 + - - 8 + - 938.841 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 128 + - - 9 + - 768.705 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 704 + - - 21 + - 1992.91 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 256 + - 1024 + - - 25 + - 18.2044 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 5056 + - - 14 + - 3915.61 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 448 + - - 14 + - 2941.67 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 64 + - - 12 + - 1738.99 + - - - 128 + - 5056 + - 1 + - 128 + - 128 + - 128 + - 128 + - 5056 + - - 2 + - 695.88 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 704 + - - 14 + - 2849.99 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 5056 + - - 14 + - 4258.78 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 256 + - - 10 + - 3059.35 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1856 + - - 6 + - 3115.65 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 4288 + - - 14 + - 4273.47 + - - - 6784 + - 256 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 256 + - - 3 + - 1268.25 + - - - 704 + - 256 + - 1 + - 128 + - 704 + - 704 + - 128 + - 256 + - - 2 + - 261.668 + - - - 4288 + - 4 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 4 + - - 22 + - 39.5439 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 704 + - - 6 + - 3061.04 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 768 + - 2368 + - - 6 + - 2753.26 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1856 + - - 18 + - 4110.42 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 3584 + - - 14 + - 4400.95 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 256 + 
- 256 + - - 17 + - 106.998 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 6784 + - - 14 + - 3002.41 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 5056 + - - 6 + - 3570.58 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 5056 + - - 16 + - 4197.09 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1024 + - - 14 + - 3594.01 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 6784 + - - 14 + - 4354.86 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3584 + - - 6 + - 3619.9 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 5056 + - - 14 + - 4282.46 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 128 + - - 21 + - 2379.11 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 3584 + - - 14 + - 4292.05 + - - - 1408 + - 2944 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 2944 + - - 3 + - 1549.95 + - - - 448 + - 3584 + - 1 + - 128 + - 448 + - 448 + - 128 + - 3584 + - - 3 + - 1223.34 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 3584 + - - 14 + - 3468.97 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 2368 + - - 14 + - 4166.69 + - - - 704 + - 3584 + - 1 + - 128 + - 704 + - 704 + - 128 + - 3584 + - - 3 + - 1473.9 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 4288 + - - 14 + - 3919.7 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 2944 + - - 14 + - 3916.51 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3584 + - - 21 + - 2317.16 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 5056 + - - 10 + - 2539.35 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 5888 + - - 14 + - 4367.11 + - - - 5888 + - 704 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 704 + - - 3 + - 1378.85 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 5056 + - - 14 + - 3992.59 + - - - 128 + - 2368 + - 1 + - 128 + - 128 + - 128 + - 
128 + - 2368 + - - 2 + - 396.538 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 448 + - - 6 + - 3140.27 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1024 + - - 6 + - 1294.54 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1024 + - - 12 + - 2635.54 + - - - 5056 + - 1024 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 1024 + - - 1 + - 1745.42 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1024 + - - 16 + - 3956.68 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 4 + - - 24 + - 87.2296 + - - - 4288 + - 6784 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 6784 + - - 3 + - 2306.66 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 4 + - - 26 + - 196.122 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 256 + - 4 + - - 29 + - 0.0978968 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 6784 + - - 24 + - 344.27 + - - - 1024 + - 4288 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 4288 + - - 4 + - 1486.24 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 6784 + - - 14 + - 4174.99 + - - - 2368 + - 1856 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 1856 + - - 3 + - 1769.51 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 5056 + - - 14 + - 3691.24 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 2944 + - - 14 + - 4290.09 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 256 + - 5888 + - - 6 + - 2063.07 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 5888 + - - 14 + - 4034.17 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 2944 + - - 14 + - 3846.24 + - - - 1024 + - 256 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 256 + - - 2 + - 360.645 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 128 + - - 6 + - 3176.72 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1408 + - - 10 + - 3344.44 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 704 + - - 
6 + - 3326.71 + - - - 3584 + - 6784 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 6784 + - - 4 + - 2006.92 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 3584 + - - 14 + - 4224.57 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 768 + - 256 + - - 6 + - 975.204 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 448 + - - 6 + - 2168.4 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 768 + - 2944 + - - 6 + - 2488.02 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 6784 + - - 14 + - 4303.23 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 6784 + - - 14 + - 4448.94 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 64 + - - 6 + - 2028.13 + - - - 1856 + - 2368 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 2368 + - - 3 + - 1761.97 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 128 + - - 6 + - 2722.04 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 704 + - - 12 + - 2559.39 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 6784 + - - 14 + - 3769.68 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 64 + - - 6 + - 1568.89 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 6784 + - - 14 + - 4388.3 + - - - 64 + - 2368 + - 1 + - 128 + - 64 + - 64 + - 128 + - 2368 + - - 2 + - 218.453 + - - - 1024 + - 3584 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 3584 + - - 4 + - 1310.14 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 256 + - 3584 + - - 25 + - 58.8144 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1024 + - - 17 + - 408.802 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 768 + - 5056 + - - 6 + - 3097.89 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 4 + - - 26 + - 102.98 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 768 + - 1856 + - - 6 + - 2924.99 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1856 + - - 6 + - 2287.84 + - - - 128 + - 128 + - 1 + 
- 1792 + - 128 + - 128 + - 1792 + - 128 + - - 8 + - 270.252 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 4 + - - 24 + - 62.5727 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1856 + - - 14 + - 3832.55 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1024 + - - 14 + - 3492.65 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 448 + - - 9 + - 758.268 + - - - 5888 + - 2368 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 2368 + - - 4 + - 1891.19 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 704 + - - 9 + - 921.046 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1856 + - - 18 + - 4133.48 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 2368 + - - 14 + - 4220.49 + - - - 64 + - 6784 + - 1 + - 128 + - 64 + - 64 + - 128 + - 6784 + - - 2 + - 539.349 + - - - 5888 + - 1408 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 1408 + - - 4 + - 1773.33 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 2368 + - - 6 + - 2234.13 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2944 + - - 6 + - 2064.83 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 5056 + - - 14 + - 4185.97 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 4 + - - 28 + - 49.2591 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 5888 + - - 14 + - 3995.35 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1408 + - - 6 + - 1037.26 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 768 + - 5888 + - - 6 + - 2447.62 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 2368 + - - 18 + - 3975.89 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 448 + - - 11 + - 1152.02 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 5056 + - - 14 + - 3847.8 + - - - 6784 + - 5056 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 5056 + - - 3 + - 2253.43 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 
5888 + - 768 + - 64 + - - 6 + - 2498.33 + - - - 1856 + - 1408 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 1408 + - - 3 + - 1593.44 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 6784 + - - 14 + - 4369.31 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 256 + - 2944 + - - 14 + - 2839.15 + - - - 6784 + - 6784 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 6784 + - - 3 + - 2315.32 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 1856 + - - 14 + - 4209.42 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 448 + - - 18 + - 3289.57 + - - - 1024 + - 5888 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 5888 + - - 4 + - 1494.02 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 448 + - - 12 + - 2471.93 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 2368 + - - 14 + - 3705.4 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1856 + - - 6 + - 1319.82 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 256 + - 4 + - - 26 + - 13.8209 + - - - 128 + - 4 + - 1 + - 128 + - 128 + - 128 + - 128 + - 4 + - - 22 + - 1.23004 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 768 + - 4 + - - 26 + - 4.26667 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 6784 + - - 14 + - 4338.11 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 4 + - - 25 + - 41.5211 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 256 + - - 10 + - 2813.25 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 64 + - - 17 + - 564.256 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 256 + - 64 + - - 17 + - 24.4537 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 448 + - - 5 + - 1556.61 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 6784 + - - 14 + - 4257.19 + - - - 448 + - 1024 + - 1 + - 128 + - 448 + - 448 + - 128 + - 1024 + - - 2 + - 573.44 + - - - 64 + - 5056 + - 1 + - 128 + - 64 + - 64 + - 128 + - 5056 + - - 2 + - 414.519 + - - - 
1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 6784 + - - 14 + - 4398.8 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1856 + - - 6 + - 2286.37 + - - - 4288 + - 3584 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 3584 + - - 1 + - 2207.28 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 4 + - - 26 + - 14.4991 + - - - 128 + - 1856 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1856 + - - 2 + - 333.137 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1856 + - - 6 + - 714.49 + - - - 2944 + - 5056 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 5056 + - - 3 + - 2157.62 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 4 + - - 26 + - 20.3431 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 1408 + - - 7 + - 2863.76 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 4 + - - 26 + - 46.0859 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 704 + - - 9 + - 615.399 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 704 + - - 14 + - 3697.87 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 768 + - 704 + - - 6 + - 2102.61 + - - - 4 + - 3584 + - 1 + - 128 + - 4 + - 4 + - 128 + - 3584 + - - 22 + - 31.3787 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 64 + - - 6 + - 1791.77 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 4288 + - - 14 + - 3981.13 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 256 + - - 5 + - 1674.63 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 128 + - - 6 + - 1022.55 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 256 + - 4288 + - - 6 + - 1715.2 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 704 + - - 14 + - 2940.81 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 768 + - 128 + - - 17 + - 287.019 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 5056 + - - 14 + - 4299.56 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 
1024 + - - 14 + - 3900.87 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 4 + - - 27 + - 65.4216 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 2944 + - - 18 + - 4067.43 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1408 + - - 6 + - 767.591 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 768 + - 5056 + - - 6 + - 2145.31 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 2944 + - - 10 + - 3417.46 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 5056 + - - 14 + - 4160.01 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 256 + - - 6 + - 2633.85 + - - - 4 + - 704 + - 1 + - 128 + - 4 + - 4 + - 128 + - 704 + - - 22 + - 6.16366 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1024 + - - 29 + - 47.6048 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 3584 + - - 6 + - 3262.24 + - - - 1856 + - 128 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 2 + - 331.973 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 4288 + - - 14 + - 4142.12 + - - - 5888 + - 256 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 256 + - - 0 + - 1058.24 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 768 + - 6784 + - - 14 + - 4192.48 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1024 + - - 16 + - 3262.03 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 64 + - - 11 + - 1539.49 + - - - 1856 + - 256 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 256 + - - 2 + - 604.307 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 1782.74 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 1024 + - - 14 + - 3782.89 + - - - 448 + - 448 + - 1 + - 128 + - 448 + - 448 + - 128 + - 448 + - - 2 + - 283.681 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 5056 + - - 16 + - 4242.85 + - - - 4 + - 256 + - 1 + - 128 + - 4 + - 4 + - 128 + - 256 + - - 22 + - 2.263 + - - - 3584 + - 4 + - 1 
+ - 768 + - 3584 + - 3584 + - 768 + - 4 + - - 25 + - 135.325 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1408 + - - 6 + - 2150.47 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 6784 + - - 14 + - 4463.66 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 2368 + - - 16 + - 3772.83 + - - - 4 + - 64 + - 1 + - 128 + - 4 + - 4 + - 128 + - 64 + - - 23 + - 0.56497 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 256 + - - 6 + - 1745.2 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 1408 + - - 26 + - 179.672 + - - - 4288 + - 256 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 256 + - - 3 + - 855.928 + - - - 2944 + - 1856 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 1856 + - - 1 + - 1723.68 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1856 + - - 14 + - 4146.18 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 768 + - 2368 + - - 6 + - 2026.32 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 6784 + - - 24 + - 295.215 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1856 + - - 14 + - 3984.73 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 5056 + - - 14 + - 4365.93 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 4288 + - - 14 + - 4161.65 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 64 + - - 9 + - 988.049 + - - - 5056 + - 4288 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 4288 + - - 3 + - 2187.57 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 128 + - - 6 + - 1705.21 + - - - 2944 + - 6784 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 6784 + - - 3 + - 2142.93 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 2368 + - - 16 + - 3716.22 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 256 + - 5056 + - - 6 + - 1593.03 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 3584 + - - 14 + - 4394.05 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 
1792 + - 128 + - - 12 + - 1222.83 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 768 + - 5888 + - - 25 + - 190.963 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1024 + - - 14 + - 3210.16 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 128 + - - 6 + - 2489.74 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 448 + - - 6 + - 3238.45 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 2368 + - - 14 + - 4051.23 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 768 + - 4288 + - - 12 + - 1987.59 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 2944 + - - 14 + - 4136.75 + - - - 6784 + - 4 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 4 + - - 22 + - 62.8336 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1856 + - - 16 + - 3650.86 + - - - 2368 + - 448 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 448 + - - 3 + - 851.245 + - - - 1024 + - 64 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 64 + - - 2 + - 94.2117 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 128 + - - 5 + - 1056.81 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 2368 + - - 16 + - 3908.77 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1024 + - - 16 + - 3429.59 + - - - 256 + - 128 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 2 + - 47.5329 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 64 + - - 12 + - 2102.3 + - - - 5056 + - 3584 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 3584 + - - 3 + - 2200.45 + - - - 128 + - 256 + - 1 + - 128 + - 128 + - 128 + - 128 + - 256 + - - 2 + - 48.3215 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 6784 + - - 14 + - 4236.26 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 3584 + - - 14 + - 4061.33 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 256 + - - 10 + - 2826.33 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 6784 + - 
- 14 + - 3947.7 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 64 + - - 21 + - 2101.37 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 1408 + - - 16 + - 4056.44 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 5888 + - - 14 + - 4451.22 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 5888 + - - 14 + - 3722.55 + - - - 4288 + - 4288 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 4288 + - - 1 + - 2208.98 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 64 + - - 6 + - 3174.13 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 2368 + - - 14 + - 3544.36 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 128 + - - 6 + - 3345.07 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 2944 + - - 14 + - 4306.35 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 448 + - - 6 + - 2746.57 + - - - 1408 + - 704 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 704 + - - 2 + - 790.22 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 5056 + - - 16 + - 3949.63 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 704 + - - 14 + - 3156.71 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 448 + - - 18 + - 3995.45 + - - - 2944 + - 2944 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 2944 + - - 3 + - 1963.95 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 64 + - - 26 + - 7.87692 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 3584 + - - 14 + - 4358.45 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 4 + - - 26 + - 180.642 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 4288 + - - 14 + - 4289.98 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 768 + - 5888 + - - 6 + - 2647.34 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 5888 + - - 14 + - 3898.41 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 2944 + - - 
14 + - 3617.92 + - - - 2944 + - 4288 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 4288 + - - 3 + - 2052.87 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1024 + - - 14 + - 4163.13 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1408 + - - 6 + - 2610.65 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 5056 + - - 16 + - 4025.78 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1408 + - - 14 + - 3617.59 + - - - 1856 + - 1024 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 1024 + - - 3 + - 1466.89 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 704 + - - 26 + - 98.277 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 2368 + - - 14 + - 3583.69 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 768 + - 4288 + - - 6 + - 3210.73 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 2368 + - - 18 + - 3920.2 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 704 + - - 6 + - 3214.41 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1024 + - - 14 + - 3867.15 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1408 + - - 11 + - 1350.38 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 128 + - - 21 + - 1407.48 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 256 + - 128 + - - 25 + - 3.35051 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 448 + - - 6 + - 3403.06 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1856 + - - 18 + - 3880.26 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 4288 + - - 14 + - 4149.39 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 3584 + - - 14 + - 4199.39 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1408 + - - 14 + - 3521.01 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1024 + - - 12 + - 2821.12 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 448 + - - 14 + 
- 3517.53 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 6784 + - - 14 + - 3964.46 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 4 + - - 26 + - 10.7899 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 2944 + - - 6 + - 3267.55 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1856 + - - 14 + - 4054.97 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 6784 + - - 14 + - 4310.4 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 6784 + - - 6 + - 3294.01 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 256 + - - 12 + - 2214.46 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 448 + - - 6 + - 3440.14 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 5888 + - - 14 + - 4101.95 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 256 + - - 29 + - 27.9386 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 64 + - - 19 + - 152.283 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 2368 + - - 14 + - 4141.82 + - - - 1024 + - 6784 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 6784 + - - 4 + - 1629.04 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 256 + - 704 + - - 6 + - 1564.07 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 1856 + - - 26 + - 225.925 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 5056 + - - 14 + - 4363.54 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 256 + - 3584 + - - 6 + - 1241.97 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 3584 + - - 16 + - 3794.12 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 4288 + - - 14 + - 3830.08 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3584 + - - 6 + - 3422.54 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 256 + - 4 + - - 25 + - 1.75418 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 6784 + - - 14 + - 4470.8 + - - - 2368 + - 1856 + - 1 + 
- 768 + - 2368 + - 2368 + - 768 + - 1856 + - - 14 + - 3826.95 + - - - 256 + - 5056 + - 1 + - 128 + - 256 + - 256 + - 128 + - 5056 + - - 4 + - 759.42 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 768 + - 704 + - - 26 + - 35.6174 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1856 + - - 14 + - 4135.08 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 256 + - - 8 + - 260.84 + - - - 704 + - 6784 + - 1 + - 128 + - 704 + - 704 + - 128 + - 6784 + - - 4 + - 1843.99 + - - - 1856 + - 2944 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 2944 + - - 3 + - 1884.97 + - - - 3584 + - 1408 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 1408 + - - 4 + - 1501.31 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 5056 + - - 14 + - 4250.78 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 2944 + - - 14 + - 4350.29 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 64 + - - 6 + - 2852.9 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 128 + - - 6 + - 1319.82 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 4288 + - - 25 + - 255.626 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 256 + - 3584 + - - 14 + - 3401.03 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 704 + - - 6 + - 2730.4 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 64 + - - 9 + - 448.814 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 2944 + - - 16 + - 2748.4 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 64 + - - 5 + - 1522.32 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 128 + - - 11 + - 1468.91 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 5888 + - - 14 + - 4414.82 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 256 + - 6784 + - - 6 + - 2340.97 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 5888 + - - 6 + - 2864.81 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 64 + - - 
6 + - 1043.13 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 2368 + - - 14 + - 4036.35 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1408 + - - 14 + - 4198.29 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 6784 + - - 6 + - 3322.62 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 448 + - - 6 + - 3512.62 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 768 + - 4 + - - 26 + - 36.0448 + - - - 5888 + - 5888 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 5888 + - - 1 + - 1910.58 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 704 + - - 12 + - 1673.72 + - - - 4288 + - 128 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 2 + - 649.543 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 256 + - 128 + - - 17 + - 369.217 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 3584 + - - 14 + - 4286.86 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1856 + - - 16 + - 3894.58 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 5888 + - - 14 + - 4374.04 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 256 + - 704 + - - 6 + - 550.302 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1408 + - - 14 + - 3715.62 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 3584 + - - 14 + - 4359.77 + - - - 1408 + - 1856 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 1856 + - - 3 + - 1461.45 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 1408 + - - 14 + - 3992.11 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1024 + - - 6 + - 1900.33 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 128 + - - 6 + - 2171.03 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 5888 + - - 14 + - 4297.72 + - - - 256 + - 3584 + - 1 + - 128 + - 256 + - 256 + - 128 + - 3584 + - - 2 + - 749.365 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 2368 + - - 10 + - 
3093.07 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 2368 + - - 6 + - 3475.42 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 1856 + - - 6 + - 3232.7 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 2368 + - - 14 + - 3634.65 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 2944 + - - 16 + - 3411.77 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 256 + - 2368 + - - 6 + - 1494.5 + - - - 6784 + - 64 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 64 + - - 2 + - 554.415 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 128 + - - 6 + - 2934.25 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 128 + - - 6 + - 2977.7 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 768 + - 6784 + - - 6 + - 2997.55 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 5888 + - - 6 + - 2761.22 + - - - 5888 + - 64 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 64 + - - 2 + - 477.758 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 256 + - 6784 + - - 24 + - 100.971 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 768 + - 448 + - - 6 + - 1645.4 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 768 + - 128 + - - 8 + - 78.2519 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 5888 + - - 14 + - 4216.99 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 3584 + - - 14 + - 3980.94 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 4288 + - - 25 + - 327.455 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1856 + - - 5 + - 1214.41 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 6784 + - - 14 + - 4096.48 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 5056 + - - 14 + - 4202.94 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 768 + - 3584 + - - 14 + - 3732.22 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1856 + - - 12 + - 2106.7 + - - - 1024 + - 4 + - 1 + - 128 + - 
1024 + - 1024 + - 128 + - 4 + - - 22 + - 9.79621 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1024 + - - 14 + - 3984.54 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 2368 + - - 14 + - 4110.62 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1408 + - - 6 + - 2690.22 + - - - 4 + - 448 + - 1 + - 128 + - 4 + - 4 + - 128 + - 448 + - - 23 + - 4.027 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 2944 + - - 6 + - 3444.89 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 3584 + - - 18 + - 4051.1 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 256 + - - 6 + - 2014.26 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 5056 + - - 14 + - 4173.16 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 4 + - - 29 + - 65.3308 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 2368 + - - 14 + - 4220.1 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 6784 + - - 10 + - 3468.55 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 448 + - - 6 + - 3355.71 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 448 + - - 9 + - 663.379 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 4288 + - - 14 + - 4311.37 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 4 + - - 25 + - 24.9964 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 2368 + - - 16 + - 3961.51 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 5056 + - - 25 + - 343.396 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 6 + - 2064.83 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 768 + - 4 + - - 26 + - 0.268531 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 256 + - 5056 + - - 6 + - 1997.05 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 704 + - - 10 + - 2489.62 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 5056 + - 
- 14 + - 4027.44 + - - - 1856 + - 3584 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 3584 + - - 3 + - 1996.07 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 3584 + - - 6 + - 2507.27 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 256 + - 3584 + - - 14 + - 2990.7 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 2944 + - - 14 + - 4336.07 + - - - 448 + - 1856 + - 1 + - 128 + - 448 + - 448 + - 128 + - 1856 + - - 2 + - 905.021 + - - - 64 + - 2944 + - 1 + - 128 + - 64 + - 64 + - 128 + - 2944 + - - 3 + - 210.227 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 6784 + - - 14 + - 3757.94 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 4288 + - - 14 + - 4224.84 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 704 + - - 16 + - 4020.86 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 4 + - - 26 + - 154.122 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 17 + - 211.406 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 128 + - - 26 + - 14.5359 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 448 + - - 6 + - 2922.84 + - - - 5888 + - 5056 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 5056 + - - 1 + - 1902.68 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 704 + - - 14 + - 3545.39 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 2944 + - - 6 + - 3225.35 + - - - 4 + - 4288 + - 1 + - 128 + - 4 + - 4 + - 128 + - 4288 + - - 22 + - 37.7489 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1856 + - - 6 + - 3852.02 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 768 + - 2368 + - - 6 + - 1210.4 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 704 + - - 18 + - 3344.2 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1024 + - - 14 + - 1959.96 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 768 + - 2944 + - - 6 + - 3160.65 + - - - 64 + - 128 + - 1 + - 
3328 + - 64 + - 64 + - 3328 + - 128 + - - 19 + - 230.729 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1408 + - - 6 + - 3388.3 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 5056 + - - 25 + - 271.757 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 2368 + - - 26 + - 181.036 + - - - 2368 + - 5888 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 5888 + - - 3 + - 2147.11 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 6784 + - - 14 + - 4334.69 + - - - 128 + - 1408 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1408 + - - 2 + - 259.782 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 768 + - 64 + - - 8 + - 41.6984 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 256 + - 5888 + - - 14 + - 3543.68 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 256 + - - 6 + - 3388.51 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 128 + - - 9 + - 1160.83 + - - - 3584 + - 704 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 704 + - - 4 + - 1246.76 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 4288 + - - 14 + - 4078.8 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 448 + - - 6 + - 1990.64 + - - - 64 + - 704 + - 1 + - 128 + - 64 + - 64 + - 128 + - 704 + - - 2 + - 63.9659 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 4 + - - 27 + - 77.5981 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 768 + - 5888 + - - 14 + - 3880.34 + - - - 704 + - 128 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 2 + - 131.191 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 2368 + - - 16 + - 3087.17 + - - - 2368 + - 1024 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 1024 + - - 3 + - 1463.5 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 256 + - 64 + - - 17 + - 184.608 + - - - 256 + - 64 + - 1 + - 128 + - 256 + - 256 + - 128 + - 64 + - - 2 + - 23.5741 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 256 + - - 6 + - 2987.8 + - - - 
2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 1408 + - - 16 + - 3596.38 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 768 + - 1024 + - - 6 + - 1070.89 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 768 + - 448 + - - 6 + - 974.34 + - - - 3584 + - 1856 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 1856 + - - 4 + - 1677.39 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 256 + - - 14 + - 2849.45 + - - - 1024 + - 128 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 2 + - 191.521 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 704 + - - 14 + - 3627.59 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1408 + - - 14 + - 4103.69 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 4288 + - - 14 + - 4185.89 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 768 + - 1408 + - - 6 + - 2401.32 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 2944 + - - 21 + - 1943.98 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 5888 + - - 25 + - 287.816 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 5888 + - - 14 + - 3349.44 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 256 + - - 10 + - 3246.57 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1024 + - - 16 + - 3786.81 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 768 + - 3584 + - - 14 + - 3378.8 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 4 + - - 26 + - 92.2115 + - - - 6784 + - 1024 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 1024 + - - 3 + - 1820.63 + - - - 1408 + - 448 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 448 + - - 2 + - 725.56 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 5888 + - - 14 + - 4469.75 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1408 + - - 14 + - 3898.2 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 4 + - - 27 + - 98.3411 + - - - 1024 + - 4288 + - 1 + - 
256 + - 1024 + - 1024 + - 256 + - 4288 + - - 14 + - 3112.74 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1024 + - - 6 + - 2181.29 + - - - 4288 + - 704 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 704 + - - 1 + - 1473.01 + - - - 2944 + - 1024 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 1024 + - - 1 + - 1425.79 + - - - 256 + - 1024 + - 1 + - 128 + - 256 + - 256 + - 128 + - 1024 + - - 2 + - 317.991 + - - - 5056 + - 704 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 704 + - - 1 + - 1705.62 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 4288 + - - 14 + - 4246.58 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 6 + - 2185.89 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1856 + - - 14 + - 3794.9 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 256 + - 64 + - - 17 + - 53.2813 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1856 + - - 6 + - 3632.06 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1024 + - - 14 + - 3677.22 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 2368 + - - 18 + - 4015.85 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1408 + - - 18 + - 4115.4 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 6784 + - - 14 + - 4453.3 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 256 + - - 6 + - 2669.1 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 2944 + - - 6 + - 2941.68 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 768 + - 1408 + - - 12 + - 2300.73 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1408 + - - 16 + - 3786.73 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 4 + - - 24 + - 141.819 + - - - 5056 + - 5888 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 5888 + - - 3 + - 2289.54 + - - - 256 + - 448 + - 1 + - 128 + - 256 + - 256 + - 128 + - 448 + - - 2 + - 167.428 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + 
- 5888 + - 256 + - 448 + - - 6 + - 2718.53 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 768 + - 448 + - - 6 + - 2098.24 + - - - 256 + - 4288 + - 1 + - 128 + - 256 + - 256 + - 128 + - 4288 + - - 4 + - 726.371 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 128 + - - 12 + - 2365.88 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 448 + - - 6 + - 2239.29 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 768 + - 5056 + - - 12 + - 2305.31 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1024 + - - 16 + - 3332.59 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 768 + - 5056 + - - 6 + - 3322.36 + - - - 2368 + - 128 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 2 + - 404.813 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 128 + - - 6 + - 2845.93 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 5888 + - - 14 + - 3288.61 + - - - 704 + - 704 + - 1 + - 128 + - 704 + - 704 + - 128 + - 704 + - - 2 + - 591.78 + - - - 6784 + - 1408 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 1408 + - - 3 + - 2008.81 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 4 + - - 29 + - 48.7256 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1408 + - - 6 + - 3624.3 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 64 + - - 26 + - 10.6924 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 704 + - - 6 + - 2796.76 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1856 + - - 14 + - 4161.04 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1856 + - - 21 + - 2465.16 + - - - 64 + - 128 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 2 + - 11.5686 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 6784 + - - 14 + - 3378.9 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1856 + - - 5 + - 1698.66 + - - - 5888 + - 3584 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 3584 + - - 3 + - 1850.8 + - 
- - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 3584 + - - 16 + - 3197.4 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3584 + - - 14 + - 3583.58 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 4288 + - - 14 + - 4194.22 + - - - 2368 + - 1408 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 1408 + - - 1 + - 1675.45 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 5888 + - - 14 + - 4289.0 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3584 + - - 14 + - 4065.82 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 4 + - - 29 + - 194.699 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 5888 + - - 14 + - 4298.63 + - - - 1856 + - 64 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 64 + - - 2 + - 170.147 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1408 + - - 14 + - 3751.5 + - - - 2944 + - 256 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 256 + - - 2 + - 831.629 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 128 + - - 6 + - 1101.83 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1024 + - - 5 + - 748.601 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 1302.58 + - - - 448 + - 256 + - 1 + - 128 + - 448 + - 448 + - 128 + - 256 + - - 2 + - 168.814 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1024 + - - 7 + - 3177.17 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 3584 + - - 14 + - 4218.1 + - - - 128 + - 704 + - 1 + - 128 + - 128 + - 128 + - 128 + - 704 + - - 2 + - 130.597 + - - - 1024 + - 2944 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 2944 + - - 4 + - 1234.25 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 3584 + - - 25 + - 228.887 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 2944 + - - 14 + - 4131.78 + - - - 2368 + - 5056 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 5056 + - - 3 + - 2100.23 + - - - 1856 + - 2944 + - 
1 + - 768 + - 1856 + - 1856 + - 768 + - 2944 + - - 14 + - 4079.25 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 64 + - - 20 + - 2120.43 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 6784 + - - 14 + - 4327.63 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 768 + - 4288 + - - 6 + - 1820.7 + - - - 1856 + - 704 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 704 + - - 3 + - 1047.92 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 2368 + - - 6 + - 3706.33 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 128 + - - 10 + - 2817.47 + - - - 704 + - 2944 + - 1 + - 128 + - 704 + - 704 + - 128 + - 2944 + - - 3 + - 1227.74 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1024 + - - 14 + - 2614.01 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 5888 + - - 14 + - 4324.17 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 2368 + - - 6 + - 2806.32 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1856 + - - 14 + - 3709.73 + - - - 4 + - 6784 + - 1 + - 128 + - 4 + - 4 + - 128 + - 6784 + - - 22 + - 60.1357 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 448 + - - 6 + - 2739.19 + - - - 2944 + - 4 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 4 + - - 22 + - 27.0715 + - - - 256 + - 4 + - 1 + - 128 + - 256 + - 256 + - 128 + - 4 + - - 22 + - 2.47869 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1408 + - - 6 + - 3748.66 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 5056 + - - 14 + - 4378.79 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 2368 + - - 6 + - 2732.68 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 128 + - - 9 + - 406.667 + - - - 64 + - 1408 + - 1 + - 128 + - 64 + - 64 + - 128 + - 1408 + - - 2 + - 134.37 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 4 + - - 25 + - 32.1908 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 3328 + 
- 128 + - - 9 + - 689.853 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 448 + - - 21 + - 2173.73 + - - - 1408 + - 64 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 64 + - - 2 + - 129.541 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 768 + - 2944 + - - 12 + - 1461.06 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 5888 + - - 14 + - 4378.32 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 128 + - - 7 + - 2928.23 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 448 + - - 6 + - 3147.23 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 6784 + - - 14 + - 4541.16 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 14 + - 2735.93 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 6784 + - - 18 + - 4118.04 + - - - 704 + - 1408 + - 1 + - 128 + - 704 + - 704 + - 128 + - 1408 + - - 4 + - 804.653 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 64 + - - 6 + - 998.534 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 4 + - - 25 + - 65.7507 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 64 + - - 6 + - 2774.83 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 4288 + - - 18 + - 4146.53 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 4 + - - 25 + - 150.511 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 4288 + - - 10 + - 2639.32 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 256 + - - 6 + - 3242.17 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 5056 + - - 6 + - 3496.28 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 128 + - - 12 + - 1668.88 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 4288 + - - 6 + - 2032.16 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 64 + - - 19 + - 414.331 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1408 + - - 14 + - 
4348.82 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3584 + - - 14 + - 4280.57 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1856 + - - 16 + - 3823.12 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 5888 + - - 14 + - 3317.37 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 2944 + - - 14 + - 3988.33 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 768 + - 4288 + - - 14 + - 3971.96 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 768 + - 3584 + - - 25 + - 139.58 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 256 + - - 14 + - 3765.58 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 64 + - - 19 + - 239.991 + - - - 64 + - 4 + - 1 + - 128 + - 64 + - 64 + - 128 + - 4 + - - 22 + - 0.605923 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 1856 + - - 18 + - 4034.94 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 5056 + - - 6 + - 3304.44 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 768 + - 64 + - - 8 + - 150.226 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 768 + - 448 + - - 17 + - 496.843 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 25 + - 5.71867 + - - - 64 + - 64 + - 1 + - 128 + - 64 + - 64 + - 128 + - 64 + - - 2 + - 5.72867 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1856 + - - 6 + - 3416.44 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 6784 + - - 6 + - 3166.9 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 64 + - - 6 + - 1361.52 + - - - 5888 + - 448 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 448 + - - 3 + - 1173.34 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 768 + - 2368 + - - 12 + - 2206.06 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 4 + - - 26 + - 28.5294 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 768 + - 704 + - - 17 + - 394.291 + - - - 6784 + - 128 + - 1 + - 128 + - 6784 + - 6784 + - 128 
+ - 128 + - - 2 + - 942.58 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 5056 + - - 14 + - 4217.11 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1408 + - - 14 + - 3985.6 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1856 + - - 18 + - 2939.46 + - - - 2944 + - 1408 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 1408 + - - 3 + - 1564.95 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 256 + - - 5 + - 2076.24 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 768 + - 5056 + - - 16 + - 3760.79 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 14 + - 3004.03 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3584 + - - 16 + - 4385.76 + - - - 3584 + - 2944 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 2944 + - - 4 + - 1806.54 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 256 + - - 5 + - 1222.76 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 448 + - - 9 + - 1157.45 + - - - 704 + - 4288 + - 1 + - 128 + - 704 + - 704 + - 128 + - 4288 + - - 1 + - 1427.31 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 5888 + - - 6 + - 2815.56 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 2944 + - - 14 + - 3733.63 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 64 + - - 12 + - 1488.72 + - - - 128 + - 4288 + - 1 + - 128 + - 128 + - 128 + - 128 + - 4288 + - - 2 + - 607.739 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 704 + - - 12 + - 2888.03 + - - - 64 + - 4288 + - 1 + - 128 + - 64 + - 64 + - 128 + - 4288 + - - 2 + - 357.566 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 256 + - 2368 + - - 14 + - 2976.91 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 5888 + - - 14 + - 4387.75 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 704 + - - 14 + - 3790.63 + - - - 64 + - 1856 + - 1 + - 128 + - 64 + - 64 + - 128 + - 1856 + - - 2 + - 
180.317 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1856 + - - 14 + - 4007.93 + - - - 4288 + - 2944 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 2944 + - - 3 + - 2146.46 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 2944 + - - 14 + - 3703.84 + - - - 1856 + - 4 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 4 + - - 22 + - 17.0668 + - - - 64 + - 1024 + - 1 + - 128 + - 64 + - 64 + - 128 + - 1024 + - - 2 + - 95.4118 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 256 + - 5056 + - - 27 + - 76.5879 + - - - 5056 + - 2944 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 2944 + - - 1 + - 2165.47 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 6784 + - - 14 + - 4285.9 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 768 + - 1408 + - - 6 + - 1467.47 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 768 + - 5888 + - - 14 + - 3654.13 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 1408 + - - 6 + - 3679.57 + - - - 256 + - 1408 + - 1 + - 128 + - 256 + - 256 + - 128 + - 1408 + - - 2 + - 383.201 + - - - 6784 + - 4288 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 4288 + - - 3 + - 2247.95 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1856 + - - 14 + - 4013.58 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 704 + - - 6 + - 3279.17 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 448 + - - 6 + - 3561.0 + - - - 256 + - 256 + - 1 + - 128 + - 256 + - 256 + - 128 + - 256 + - - 2 + - 92.6304 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 4 + - - 25 + - 58.9656 + - - - 5056 + - 1856 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 1856 + - - 1 + - 2074.09 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3584 + - - 18 + - 3979.75 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1408 + - - 14 + - 3804.96 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 6784 + - - 14 + - 4304.48 + - - - 
704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 768 + - 2368 + - - 14 + - 3447.63 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 5056 + - - 16 + - 4047.07 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 3584 + - - 14 + - 4235.04 + - - - 448 + - 1408 + - 1 + - 128 + - 448 + - 448 + - 128 + - 1408 + - - 2 + - 729.23 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 2944 + - - 16 + - 3360.79 + - - - 4 + - 1408 + - 1 + - 128 + - 4 + - 4 + - 128 + - 1408 + - - 22 + - 12.782 + - - - 128 + - 2944 + - 1 + - 128 + - 128 + - 128 + - 128 + - 2944 + - - 2 + - 455.042 + - - - 1408 + - 6784 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 6784 + - - 3 + - 1970.73 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 704 + - - 14 + - 3696.9 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 2368 + - - 18 + - 3972.14 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 1856 + - - 14 + - 3600.7 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1408 + - - 14 + - 3637.74 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3584 + - - 25 + - 299.087 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 3584 + - - 14 + - 4360.31 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1856 + - - 14 + - 3908.18 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 5056 + - - 18 + - 4036.73 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 128 + - - 6 + - 2030.33 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1856 + - - 18 + - 3665.17 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 256 + - 4288 + - - 25 + - 67.5109 + - - - 2944 + - 2368 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 2368 + - - 3 + - 1832.77 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 64 + - - 9 + - 674.254 + - - - 2368 + - 2944 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 2944 + - - 1 + - 1930.13 + - - - 5888 + - 3584 + 
- 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3584 + - - 14 + - 4319.35 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 768 + - 64 + - - 26 + - 4.2965 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 64 + - - 19 + - 131.375 + - - - 3584 + - 5888 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 5888 + - - 4 + - 1885.32 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 704 + - - 14 + - 3708.99 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 6 + - 2307.19 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 256 + - 1856 + - - 25 + - 32.3222 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 6784 + - - 14 + - 4449.05 + - - - 3584 + - 448 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 448 + - - 4 + - 1026.78 + - - - 448 + - 128 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 2 + - 84.8755 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 3584 + - - 14 + - 3747.81 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 5056 + - - 14 + - 4028.67 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 2368 + - - 5 + - 1765.49 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 4 + - - 26 + - 178.447 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 768 + - 4288 + - - 6 + - 2643.8 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 64 + - - 6 + - 2140.87 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 768 + - 4 + - - 26 + - 24.8601 + - - - 128 + - 448 + - 1 + - 128 + - 128 + - 128 + - 128 + - 448 + - - 2 + - 84.3294 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1856 + - - 14 + - 3723.24 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 2368 + - - 14 + - 4153.7 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 256 + - 2368 + - - 6 + - 2260.16 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 2944 + - - 14 + - 4282.68 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 448 + - - 
6 + - 3531.03 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 2944 + - - 26 + - 277.24 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1408 + - - 14 + - 3662.35 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 256 + - 2944 + - - 6 + - 1863.77 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 64 + - - 5 + - 1778.13 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 17 + - 409.6 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 5056 + - - 14 + - 4267.29 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1024 + - - 14 + - 3157.62 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 5888 + - - 14 + - 4190.54 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3584 + - - 18 + - 4076.96 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 448 + - - 26 + - 67.0388 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1024 + - - 14 + - 3445.75 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 64 + - - 9 + - 655.36 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 256 + - 3584 + - - 6 + - 2178.05 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 768 + - 4 + - - 26 + - 15.147 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1408 + - - 6 + - 3070.61 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 4 + - - 26 + - 7.70753 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 4 + - - 26 + - 119.125 + - - - 5056 + - 6784 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 6784 + - - 1 + - 2331.35 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 5888 + - - 14 + - 3929.28 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 448 + - - 16 + - 3378.1 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 3584 + - - 14 + - 4278.18 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 256 + - - 6 + - 3105.04 + - - - 4288 + - 5056 + 
- 1 + - 768 + - 4288 + - 4288 + - 768 + - 5056 + - - 14 + - 4150.22 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 6784 + - - 14 + - 4317.69 + - - - 6784 + - 2944 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 2944 + - - 3 + - 2195.79 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 704 + - - 18 + - 3912.39 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 5888 + - - 14 + - 4288.37 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 6 + - 1892.55 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1024 + - - 6 + - 776.723 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 2368 + - - 12 + - 1403.96 + - - - 3584 + - 2368 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 2368 + - - 4 + - 1789.31 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 2368 + - - 26 + - 258.894 + - - - 448 + - 2368 + - 1 + - 128 + - 448 + - 448 + - 128 + - 2368 + - - 4 + - 826.781 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 768 + - 704 + - - 6 + - 767.591 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1024 + - - 16 + - 3385.73 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 2944 + - - 16 + - 3926.46 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 128 + - - 6 + - 2391.33 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 2368 + - - 14 + - 3578.14 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 4 + - - 26 + - 167.805 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 2368 + - - 14 + - 4243.79 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 256 + - - 9 + - 746.522 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 5056 + - - 16 + - 4350.66 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1408 + - - 5 + - 998.767 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 2944 + - - 14 + - 4353.0 + - - - 2368 + - 4288 + - 1 + - 1792 + 
- 2368 + - 2368 + - 1792 + - 4288 + - - 14 + - 4033.43 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1856 + - - 14 + - 3770.5 + - - - 2368 + - 3584 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 3584 + - - 3 + - 2050.91 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 128 + - - 6 + - 2650.25 + - - - 448 + - 704 + - 1 + - 128 + - 448 + - 448 + - 128 + - 704 + - - 2 + - 416.016 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 64 + - - 6 + - 2484.51 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 768 + - 3584 + - - 6 + - 2926.26 + - - - 1024 + - 1024 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 1024 + - - 4 + - 764.338 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3584 + - - 14 + - 4366.79 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 256 + - 2944 + - - 25 + - 49.1948 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 2944 + - - 26 + - 199.836 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 768 + - 1024 + - - 6 + - 2983.75 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 3584 + - - 14 + - 3935.22 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 5888 + - - 14 + - 4415.85 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 4288 + - - 14 + - 4290.87 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 768 + - 64 + - - 17 + - 250.913 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 2944 + - - 14 + - 4249.66 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 256 + - - 6 + - 2935.9 + - - - 128 + - 5888 + - 1 + - 128 + - 128 + - 128 + - 128 + - 5888 + - - 2 + - 779.484 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 2944 + - - 16 + - 4246.43 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 6784 + - - 14 + - 4377.96 + - - - 5888 + - 4288 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 4288 + - - 4 + - 2015.49 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 
768 + - 704 + - - 14 + - 3455.36 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 256 + - 4288 + - - 14 + - 2873.29 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 3584 + - - 14 + - 3825.52 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 768 + - 2944 + - - 6 + - 2668.82 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 5888 + - - 14 + - 4321.94 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1408 + - - 6 + - 1969.28 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 2944 + - - 14 + - 4291.77 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 5888 + - - 14 + - 3829.55 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 2944 + - - 14 + - 4208.83 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 5056 + - - 12 + - 2458.71 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 2944 + - - 16 + - 3965.52 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 4288 + - - 14 + - 3760.67 + - - - 256 + - 1856 + - 1 + - 128 + - 256 + - 256 + - 128 + - 1856 + - - 2 + - 468.981 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 128 + - - 5 + - 2018.66 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 768 + - 128 + - - 17 + - 495.948 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 6784 + - - 14 + - 4207.7 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 64 + - - 6 + - 697.447 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 448 + - - 26 + - 46.2985 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1024 + - - 10 + - 2134.51 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 5056 + - - 14 + - 4393.36 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 2944 + - - 14 + - 4170.09 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 704 + - - 6 + - 1042.89 + - - - 2944 + - 64 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 64 + 
- - 2 + - 262.601 + - - - 704 + - 4 + - 1 + - 128 + - 704 + - 704 + - 128 + - 4 + - - 22 + - 6.84748 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 768 + - 4 + - - 29 + - 7.87692 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 4288 + - - 14 + - 3635.11 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 128 + - - 6 + - 2077.28 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 6784 + - - 14 + - 4472.49 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 5056 + - - 14 + - 4205.98 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 4288 + - - 14 + - 4139.4 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 128 + - - 6 + - 2243.73 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 3584 + - - 14 + - 3844.03 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 2368 + - - 14 + - 3926.62 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 256 + - - 9 + - 494.611 + - - - 3584 + - 4288 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 4288 + - - 4 + - 1896.14 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 4288 + - - 14 + - 3879.42 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1408 + - - 10 + - 3021.56 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 256 + - 64 + - - 17 + - 294.845 + - - - 4 + - 5888 + - 1 + - 128 + - 4 + - 4 + - 128 + - 5888 + - - 23 + - 51.5506 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 128 + - - 12 + - 2175.6 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1856 + - - 14 + - 3969.94 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1024 + - - 12 + - 2400.75 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 2368 + - - 6 + - 3846.67 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1024 + - - 12 + - 2607.61 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 4 + - - 24 + - 67.1804 + - - - 
1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 5056 + - - 14 + - 3641.35 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 256 + - 4288 + - - 14 + - 3351.84 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 2368 + - - 14 + - 3949.8 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1024 + - - 16 + - 3881.05 + - - - 704 + - 5056 + - 1 + - 128 + - 704 + - 704 + - 128 + - 5056 + - - 1 + - 1679.47 + - - - 1856 + - 1856 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 1856 + - - 1 + - 1725.06 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 2944 + - - 6 + - 2786.74 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1408 + - - 14 + - 3258.78 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 448 + - - 18 + - 3217.97 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1856 + - - 14 + - 4009.94 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 2368 + - - 16 + - 3550.11 + - - - 2944 + - 128 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 2 + - 483.118 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 768 + - 448 + - - 17 + - 250.684 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 2368 + - - 14 + - 4180.98 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 5056 + - - 14 + - 4215.39 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 448 + - - 18 + - 2750.55 + - - - 448 + - 6784 + - 1 + - 128 + - 448 + - 448 + - 128 + - 6784 + - - 1 + - 1479.4 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 64 + - - 6 + - 1238.21 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 448 + - - 18 + - 2830.48 + - - - 1856 + - 448 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 448 + - - 2 + - 900.732 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 128 + - - 6 + - 3042.4 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 4288 + - - 14 + - 4266.67 + - - - 1408 + - 4288 + - 
1 + - 768 + - 1408 + - 1408 + - 768 + - 4288 + - - 14 + - 3787.5 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 448 + - - 9 + - 427.03 + - - - 5056 + - 5056 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 5056 + - - 1 + - 2249.91 + - - - 1024 + - 1408 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 1408 + - - 4 + - 954.039 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 5888 + - - 14 + - 4077.8 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 768 + - 128 + - - 8 + - 149.797 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 256 + - 5888 + - - 27 + - 88.3545 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 2944 + - - 14 + - 4345.57 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 6784 + - - 14 + - 3848.24 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 4288 + - - 14 + - 4255.32 + - - - 6784 + - 3584 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 3584 + - - 3 + - 2206.09 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 2368 + - - 14 + - 3841.52 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 5056 + - - 6 + - 2373.37 + - - - 3584 + - 64 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 64 + - - 2 + - 313.945 + - - - 1408 + - 1024 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 1024 + - - 3 + - 1082.02 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 5888 + - - 14 + - 4445.64 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1024 + - - 11 + - 1028.79 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1408 + - - 12 + - 1653.16 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 14 + - 2456.63 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 256 + - - 14 + - 3541.28 + - - - 2368 + - 64 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 64 + - - 2 + - 211.038 + - - - 128 + - 3584 + - 1 + - 128 + - 128 + - 128 + - 128 + - 3584 + - - 2 + - 553.965 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 256 + - 
704 + - - 28 + - 13.4697 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 704 + - - 10 + - 2987.41 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 704 + - - 6 + - 3207.17 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 6784 + - - 14 + - 4357.86 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 256 + - - 6 + - 1935.41 + - - - 1024 + - 704 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 704 + - - 2 + - 708.497 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 64 + - - 6 + - 2089.27 + - - - 4288 + - 64 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 64 + - - 2 + - 365.605 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1024 + - - 14 + - 3788.51 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 768 + - 64 + - - 8 + - 81.243 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 5888 + - - 16 + - 4158.87 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1408 + - - 6 + - 1771.79 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 704 + - - 5 + - 2175.12 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1024 + - - 14 + - 3016.17 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 3584 + - - 16 + - 4344.42 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 5056 + - - 14 + - 3972.04 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 256 + - - 14 + - 3150.52 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1024 + - - 12 + - 2072.66 + - - - 5056 + - 2368 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 2368 + - - 3 + - 2044.64 + - - - 5888 + - 4 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 4 + - - 22 + - 54.5348 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1408 + - - 14 + - 3317.19 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 128 + - - 7 + - 2579.92 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 768 + - 5056 + - - 25 + - 
172.426 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 704 + - - 14 + - 3331.43 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 704 + - - 11 + - 1417.8 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1408 + - - 26 + - 122.009 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 5056 + - - 14 + - 4336.72 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 64 + - - 12 + - 2238.86 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 448 + - - 6 + - 3465.34 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 256 + - 5056 + - - 14 + - 2973.04 + - - - 2944 + - 3584 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 3584 + - - 3 + - 2035.7 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 128 + - - 6 + - 2026.32 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 256 + - 704 + - - 17 + - 291.271 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1024 + - - 14 + - 3716.54 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1408 + - - 6 + - 3631.36 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 6784 + - - 14 + - 3900.56 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 448 + - - 18 + - 4074.16 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 768 + - 1024 + - - 6 + - 1726.05 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 256 + - 1408 + - - 25 + - 24.5872 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1024 + - - 12 + - 2566.17 + - - - 1408 + - 1408 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 1408 + - - 3 + - 1123.61 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 768 + - 128 + - - 26 + - 7.81431 + - - - 64 + - 256 + - 1 + - 128 + - 64 + - 64 + - 128 + - 256 + - - 2 + - 23.2397 + - - - 3584 + - 128 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 2 + - 532.272 + - - - 5056 + - 128 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 2 + - 739.621 + - - - 2944 + - 1024 + - 1 + - 
256 + - 2944 + - 2944 + - 256 + - 1024 + - - 16 + - 2927.74 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 5056 + - - 14 + - 3987.13 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 128 + - - 9 + - 492.62 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 448 + - - 6 + - 1856.99 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 2368 + - - 14 + - 3983.14 + - - - 4 + - 2944 + - 1 + - 128 + - 4 + - 4 + - 128 + - 2944 + - - 22 + - 26.1328 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 5056 + - - 14 + - 3223.25 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 5888 + - - 14 + - 4322.83 + - - - 4288 + - 5056 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 5056 + - - 3 + - 2244.03 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 64 + - - 17 + - 106.563 + - - - 1408 + - 3584 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 3584 + - - 3 + - 1719.35 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 4 + - - 26 + - 18.5392 + - - - 1856 + - 5056 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 5056 + - - 1 + - 2114.69 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 2368 + - - 6 + - 3800.22 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 4288 + - - 14 + - 4335.12 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 5888 + - - 14 + - 3744.67 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 64 + - - 6 + - 1820.7 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 64 + - - 6 + - 3311.04 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 256 + - - 6 + - 2406.33 + - - - 64 + - 5888 + - 1 + - 128 + - 64 + - 64 + - 128 + - 5888 + - - 2 + - 459.551 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 448 + - - 18 + - 3261.15 + - - - 5888 + - 1024 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 1024 + - - 3 + - 1486.43 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 
1792 + - 2944 + - - 14 + - 4327.23 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 4288 + - - 14 + - 4079.0 + - - - 128 + - 128 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 2 + - 24.8242 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1408 + - - 14 + - 4148.84 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 128 + - - 10 + - 2487.01 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 4 + - - 26 + - 173.019 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 448 + - - 6 + - 2533.32 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1856 + - - 26 + - 82.3935 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 448 + - - 6 + - 3006.16 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 2368 + - - 14 + - 3958.7 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 128 + - - 6 + - 1927.86 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3584 + - - 16 + - 4128.97 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 256 + - 704 + - - 6 + - 1572.05 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 2944 + - - 14 + - 4052.77 + - - - 128 + - 1024 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1024 + - - 2 + - 192.753 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1856 + - - 26 + - 155.564 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 4288 + - - 14 + - 3844.0 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1024 + - - 26 + - 92.5837 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 5888 + - - 14 + - 4439.56 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 4288 + - - 14 + - 4223.36 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1408 + - - 21 + - 1963.16 + - - - 1856 + - 6784 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 6784 + - - 4 + - 2107.3 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 256 + - 64 + - - 28 + - 1.68214 
+ - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1408 + - - 6 + - 3221.42 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 5888 + - - 14 + - 4418.72 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 2368 + - - 14 + - 4154.2 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 256 + - - 14 + - 3357.33 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 5888 + - - 6 + - 2939.2 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 256 + - 2944 + - - 6 + - 1065.25 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 5056 + - - 14 + - 4209.84 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 704 + - - 18 + - 3873.6 + - - - 1408 + - 5056 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 5056 + - - 3 + - 1828.28 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 4 + - - 26 + - 131.073 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1856 + - - 6 + - 979.662 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 64 + - - 6 + - 773.77 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 2944 + - - 6 + - 3364.88 + - - - 1408 + - 128 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 2 + - 259.549 + - - - 64 + - 3584 + - 1 + - 128 + - 64 + - 64 + - 128 + - 3584 + - - 2 + - 310.23 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 768 + - 128 + - - 6 + - 771.012 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 4 + - - 26 + - 64.8804 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 6784 + - - 14 + - 4264.23 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1024 + - - 16 + - 4073.76 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 4 + - - 24 + - 104.693 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 64 + - - 6 + - 1239.87 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 3584 + - - 14 + - 4231.49 + - - - 2368 + - 2368 + - 1 + - 128 
+ - 2368 + - 2368 + - 128 + - 2368 + - - 3 + - 1930.68 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 2368 + - - 7 + - 2678.24 + - - - 4 + - 5056 + - 1 + - 128 + - 4 + - 4 + - 128 + - 5056 + - - 23 + - 44.3878 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1408 + - - 6 + - 2735.11 + - - - 2944 + - 704 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 704 + - - 3 + - 1162.33 + - - - 4288 + - 2368 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 2368 + - - 3 + - 2005.23 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1408 + - - 14 + - 3959.2 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 5888 + - - 14 + - 3975.22 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 64 + - - 13 + - 666.972 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 256 + - 4 + - - 29 + - 9.47835 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 2944 + - - 6 + - 3646.63 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1856 + - - 6 + - 3150.96 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 2944 + - - 14 + - 4197.61 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 768 + - 2368 + - - 26 + - 98.8383 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 256 + - - 12 + - 2550.38 + - - - 4288 + - 5888 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 5888 + - - 3 + - 2271.12 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 4 + - - 24 + - 96.6558 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 256 + - 448 + - - 17 + - 364.813 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 1408 + - - 14 + - 3841.47 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 6784 + - - 14 + - 4167.19 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 2944 + - - 6 + - 2851.7 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 5888 + - - 14 + - 3847.57 + - - - 2368 + - 6784 + - 1 + - 128 + - 2368 + - 2368 + - 128 + 
- 6784 + - - 3 + - 2206.67 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1024 + - - 5 + - 1466.15 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5888 + - - 14 + - 2676.72 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1408 + - - 14 + - 4049.32 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 4 + - - 26 + - 96.496 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 5056 + - - 14 + - 4309.54 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 704 + - - 6 + - 3450.18 + - - - 2368 + - 256 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 256 + - - 2 + - 706.433 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 256 + - 2368 + - - 28 + - 40.4678 + - - - 4288 + - 1408 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 1408 + - - 3 + - 1817.16 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 768 + - 4288 + - - 25 + - 158.022 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 5888 + - - 14 + - 4440.15 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 3584 + - - 14 + - 3824.23 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 256 + - - 14 + - 2749.03 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 128 + - - 6 + - 3511.33 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1408 + - - 14 + - 3857.79 + - - - 6784 + - 2368 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 2368 + - - 3 + - 2136.24 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 5056 + - - 14 + - 4166.78 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5056 + - - 6 + - 2490.6 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 256 + - 128 + - - 17 + - 107.436 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 5888 + - - 14 + - 3729.95 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 128 + - - 6 + - 1858.03 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1856 + - - 14 + - 
3523.05 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 768 + - 2944 + - - 25 + - 118.501 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 1024 + - - 26 + - 135.449 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 4288 + - - 6 + - 3371.23 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 5888 + - - 14 + - 4152.54 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1024 + - - 16 + - 3911.83 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 704 + - - 6 + - 2511.23 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 6 + - 2348.81 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 5056 + - - 14 + - 4204.58 + - - - 4 + - 4 + - 1 + - 128 + - 4 + - 4 + - 128 + - 4 + - - 23 + - 0.0339976 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1408 + - - 7 + - 2521.34 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 768 + - 256 + - - 17 + - 562.239 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1024 + - - 12 + - 1222.83 + - - - 128 + - 64 + - 1 + - 128 + - 128 + - 128 + - 128 + - 64 + - - 2 + - 12.4239 + - - - 6784 + - 1856 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 1856 + - - 3 + - 2059.9 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1856 + - - 18 + - 4043.31 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 256 + - - 14 + - 3296.31 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 256 + - 128 + - - 6 + - 555.604 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 704 + - - 6 + - 2588.64 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 448 + - - 6 + - 2982.7 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 704 + - - 16 + - 3414.55 + - - - 1024 + - 5056 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 5056 + - - 4 + - 1525.84 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 128 + - - 10 + - 2334.7 + - - - 2944 + - 5888 + - 1 + - 
1792 + - 2944 + - 2944 + - 1792 + - 5888 + - - 14 + - 4255.07 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 704 + - - 16 + - 3762.02 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 4288 + - - 5 + - 2247.76 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 768 + - 3584 + - - 6 + - 3179.8 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 128 + - - 6 + - 3288.44 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1024 + - - 14 + - 3922.5 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 704 + - - 6 + - 2146.1 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 768 + - 704 + - - 6 + - 1979.17 + - - - 3584 + - 4 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 4 + - - 22 + - 32.9093 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 3584 + - - 14 + - 4167.9 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 5888 + - - 14 + - 4135.56 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 3584 + - - 14 + - 3526.1 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 448 + - - 6 + - 3481.88 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 64 + - - 6 + - 553.471 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 768 + - 256 + - - 8 + - 142.47 + - - - 1024 + - 1856 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 1856 + - - 4 + - 1211.02 + - - - 4288 + - 1856 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 1856 + - - 3 + - 1905.95 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 768 + - 6784 + - - 6 + - 2845.11 + - - - 256 + - 5888 + - 1 + - 128 + - 256 + - 256 + - 128 + - 5888 + - - 4 + - 841.789 + - - - 704 + - 5888 + - 1 + - 128 + - 704 + - 704 + - 128 + - 5888 + - - 3 + - 1638.81 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 5888 + - - 14 + - 4209.39 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 704 + - - 6 + - 3413.65 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + 
- 5056 + - - 14 + - 4340.31 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 256 + - 4 + - - 25 + - 3.25726 + - - - 448 + - 4288 + - 1 + - 128 + - 448 + - 448 + - 128 + - 4288 + - - 4 + - 1417.73 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 2368 + - - 10 + - 2400.83 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1856 + - - 6 + - 3779.2 + - - - 2368 + - 704 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 704 + - - 3 + - 1337.0 + - - - 5056 + - 1408 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 1408 + - - 1 + - 1943.71 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 128 + - - 6 + - 2748.28 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 4 + - - 25 + - 168.114 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 256 + - 448 + - - 28 + - 9.41609 + - - - 2944 + - 448 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 448 + - - 3 + - 1000.12 + - - - 4 + - 2368 + - 1 + - 128 + - 4 + - 4 + - 128 + - 2368 + - - 22 + - 21.0491 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 1035.4 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1408 + - - 14 + - 3806.17 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 704 + - - 16 + - 3949.24 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 3584 + - - 14 + - 4233.23 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 1408 + - - 14 + - 3365.77 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 256 + - 4288 + - - 6 + - 1365.76 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1856 + - - 6 + - 3329.36 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 4 + - - 26 + - 67.3915 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1856 + - - 14 + - 3188.1 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 6784 + - - 14 + - 4460.5 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 256 + - - 14 + - 3844.35 + - - - 256 + - 704 
+ - 1 + - 768 + - 256 + - 256 + - 768 + - 704 + - - 6 + - 1485.11 + - - - 5056 + - 448 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 448 + - - 4 + - 1343.77 + - - - 6784 + - 704 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 704 + - - 3 + - 1772.56 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 2368 + - - 12 + - 2382.29 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 2368 + - - 14 + - 3920.37 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 128 + - - 6 + - 2191.05 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 448 + - - 10 + - 2753.19 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 256 + - 448 + - - 6 + - 1559.9 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 2944 + - - 6 + - 2894.43 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 4 + - - 24 + - 114.729 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 256 + - - 7 + - 2453.31 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 128 + - - 17 + - 212.693 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1024 + - - 14 + - 4234.97 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 256 + - 6784 + - - 14 + - 2993.4 + - - - 4 + - 128 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 22 + - 1.12994 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 6784 + - - 14 + - 4278.9 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 4 + - - 29 + - 181.46 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1408 + - - 6 + - 2660.31 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 4 + - - 26 + - 65.8553 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 5056 + - - 14 + - 3919.88 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1408 + - - 14 + - 3974.25 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 256 + - 2368 + - - 6 + - 884.975 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 
+ - 3584 + - - 14 + - 4458.34 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 6784 + - - 14 + - 4503.64 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1408 + - - 14 + - 2638.89 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 5056 + - - 6 + - 3383.68 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 2944 + - - 14 + - 3778.86 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 689.853 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1024 + - - 16 + - 4142.52 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 5888 + - - 14 + - 4114.08 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 6784 + - - 14 + - 4210.19 + - - - 3584 + - 3584 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 3584 + - - 4 + - 1787.76 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 4 + - - 24 + - 67.877 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 768 + - 256 + - - 26 + - 15.147 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 4 + - - 26 + - 0.470341 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 6784 + - - 14 + - 4442.22 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 704 + - - 5 + - 2582.05 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3584 + - - 6 + - 3561.79 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 256 + - - 6 + - 2846.41 + - - - 1856 + - 4288 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 4288 + - - 3 + - 1925.26 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 1024 + - - 18 + - 3593.02 + - - - 256 + - 2944 + - 1 + - 128 + - 256 + - 256 + - 128 + - 2944 + - - 2 + - 628.381 + - - - 704 + - 1856 + - 1 + - 128 + - 704 + - 704 + - 128 + - 1856 + - - 3 + - 1019.31 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 64 + - - 5 + - 1883.08 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 4288 + - - 14 + - 
3453.09 + - - - 5056 + - 4 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 4 + - - 22 + - 46.4924 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 5888 + - - 14 + - 4243.3 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 6784 + - - 14 + - 4423.66 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 4288 + - - 15 + - 2207.68 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 4288 + - - 6 + - 2818.88 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1408 + - - 6 + - 554.535 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 2944 + - - 14 + - 4090.91 + - - - 3584 + - 1024 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 1024 + - - 4 + - 1365.91 + - - - 6784 + - 448 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 448 + - - 1 + - 1454.61 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 4 + - - 26 + - 39.7003 + - - - 4 + - 1024 + - 1 + - 128 + - 4 + - 4 + - 128 + - 1024 + - - 23 + - 9.34901 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4288 + - - 6 + - 2314.05 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 6784 + - - 6 + - 3378.55 + - - - 5056 + - 64 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 64 + - - 2 + - 421.951 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 5888 + - - 14 + - 4365.29 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 3584 + - - 16 + - 4031.21 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 4 + - - 25 + - 203.742 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1856 + - - 18 + - 3916.08 + - - - 5888 + - 1856 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 1856 + - - 4 + - 1818.52 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 3584 + - - 14 + - 4133.01 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1856 + - - 6 + - 2547.96 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 5056 + - - 14 + - 3944.87 + - - - 448 + - 
448 + - 1 + - 256 + - 448 + - 448 + - 256 + - 448 + - - 6 + - 1122.82 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 4288 + - - 16 + - 4356.68 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1856 + - - 16 + - 4130.38 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 704 + - - 6 + - 3118.74 + - - - 704 + - 1024 + - 1 + - 128 + - 704 + - 704 + - 128 + - 1024 + - - 2 + - 813.997 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 2944 + - - 14 + - 4112.91 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 64 + - - 6 + - 894.772 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 256 + - 5888 + - - 6 + - 1786.46 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 64 + - - 6 + - 1804.93 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 4288 + - - 14 + - 4305.44 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 6784 + - - 6 + - 3380.28 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 704 + - - 6 + - 1959.96 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1024 + - - 16 + - 3444.88 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 768 + - 2944 + - - 6 + - 3181.95 + - - - 64 + - 448 + - 1 + - 128 + - 64 + - 64 + - 128 + - 448 + - - 2 + - 42.5954 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 128 + - - 6 + - 1510.8 + - - - 4288 + - 448 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 448 + - - 3 + - 1419.04 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 6784 + - - 14 + - 4189.55 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1408 + - - 14 + - 4257.5 + - - - 448 + - 5056 + - 1 + - 128 + - 448 + - 448 + - 128 + - 5056 + - - 3 + - 1355.83 + - - - 3584 + - 5056 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 5056 + - - 4 + - 1979.33 + - - - 1856 + - 5888 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 5888 + - - 1 + - 2091.51 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + 
- 5888 + - 1792 + - 4288 + - - 14 + - 4300.73 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 768 + - 64 + - - 17 + - 392.502 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 768 + - 1856 + - - 6 + - 1878.63 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 256 + - - 9 + - 391.484 + - - - 448 + - 4 + - 1 + - 128 + - 448 + - 448 + - 128 + - 4 + - - 22 + - 4.39085 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 4288 + - - 14 + - 4042.25 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 448 + - - 14 + - 3411.7 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 64 + - - 5 + - 1318.51 + - - - 1408 + - 5888 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 5888 + - - 3 + - 1882.83 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 768 + - 3584 + - - 12 + - 1691.25 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 256 + - 5056 + - - 14 + - 3358.94 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 256 + - 6784 + - - 14 + - 3913.7 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1856 + - - 18 + - 3958.11 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 1856 + - - 14 + - 3954.34 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 256 + - - 6 + - 3640.08 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 768 + - 1856 + - - 6 + - 3139.23 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 768 + - 448 + - - 26 + - 24.7172 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 4288 + - - 14 + - 3951.93 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 4288 + - - 14 + - 4229.92 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 704 + - - 6 + - 2310.26 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 1856 + - - 14 + - 3792.69 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 768 + - 256 + - - 17 + - 285.456 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 704 + - - 12 + - 
2801.05 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 704 + - - 26 + - 67.6807 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 4288 + - - 6 + - 3680.17 + - - - 128 + - 6784 + - 1 + - 128 + - 128 + - 128 + - 128 + - 6784 + - - 2 + - 837.975 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 704 + - - 14 + - 3474.57 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 768 + - 6784 + - - 24 + - 204.64 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 768 + - 6784 + - - 14 + - 3530.04 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 128 + - - 26 + - 20.5789 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 448 + - - 6 + - 3301.27 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1856 + - - 14 + - 4279.93 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1408 + - - 6 + - 3645.25 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 256 + - - 11 + - 782.103 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1024 + - - 14 + - 3578.29 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 4288 + - - 14 + - 4353.68 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1856 + - - 14 + - 3270.0 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 2368 + - - 14 + - 4064.93 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1408 + - - 6 + - 2761.45 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 256 + - 2944 + - - 6 + - 2537.89 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 256 + - 5888 + - - 14 + - 3450.7 + - - - 1408 + - 4 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 4 + - - 22 + - 13.3106 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4 + - - 26 + - 5.80993 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 256 + - 6784 + - - 6 + - 2124.41 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1024 + - - 14 + - 3360.12 + - - - 5056 + - 4 + - 1 + - 1792 + 
- 5056 + - 5056 + - 1792 + - 4 + - - 24 + - 82.9858 + - - - 448 + - 64 + - 1 + - 128 + - 448 + - 448 + - 128 + - 64 + - - 2 + - 41.5536 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 64 + - - 19 + - 86.8026 + - - - 256 + - 6784 + - 1 + - 128 + - 256 + - 256 + - 128 + - 6784 + - - 4 + - 1128.19 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 256 + - - 10 + - 3293.34 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 704 + - - 6 + - 2674.29 + - - - 6784 + - 5888 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 5888 + - - 3 + - 2291.94 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 256 + - 448 + - - 17 + - 185.73 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 5888 + - - 14 + - 4196.68 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 128 + - - 6 + - 773.857 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 64 + - - 6 + - 2889.09 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 6784 + - - 14 + - 4416.18 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1408 + - - 26 + - 64.5964 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 2944 + - - 18 + - 3911.1 + - - - 704 + - 2368 + - 1 + - 128 + - 704 + - 704 + - 128 + - 2368 + - - 3 + - 1279.29 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 128 + - - 6 + - 1492.8 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 256 + - - 6 + - 3491.81 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 3584 + - - 12 + - 2023.64 + - - - 256 + - 704 + - 1 + - 128 + - 256 + - 256 + - 128 + - 704 + - - 2 + - 253.837 + - - - 704 + - 448 + - 1 + - 128 + - 704 + - 704 + - 128 + - 448 + - - 2 + - 418.431 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 64 + - - 11 + - 1056.26 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 64 + - - 8 + - 273.678 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1408 + - - 16 + - 
3733.68 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 4 + - - 29 + - 85.4561 + - - - 1024 + - 448 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 448 + - - 2 + - 524.288 + - - - 4288 + - 1024 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 1024 + - - 3 + - 1680.33 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 768 + - 6784 + - - 6 + - 3315.91 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 2944 + - - 14 + - 4143.93 + - - - 1408 + - 2368 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 2368 + - - 1 + - 1529.87 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 5888 + - - 14 + - 4143.37 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 256 + - - 11 + - 1136.43 + - - - 5888 + - 128 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 2 + - 793.853 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 1024 + - - 14 + - 3841.0 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 64 + - - 17 + - 408.006 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2368 + - - 6 + - 1876.08 + - - - 448 + - 5888 + - 1 + - 128 + - 448 + - 448 + - 128 + - 5888 + - - 4 + - 1484.01 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 704 + - - 14 + - 3667.12 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 64 + - - 11 + - 967.458 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 2368 + - - 14 + - 4284.79 + - - - 704 + - 64 + - 1 + - 128 + - 704 + - 704 + - 128 + - 64 + - - 2 + - 64.8288 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 4288 + - - 14 + - 3888.22 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 64 + - - 6 + - 2386.66 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 4288 + - - 14 + - 3815.81 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 1024 + - - 6 + - 3342.81 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 5056 + - - 7 + - 2813.78 + - - - 
256 + - 2368 + - 1 + - 128 + - 256 + - 256 + - 128 + - 2368 + - - 2 + - 549.226 + - - - 2368 + - 4288 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 4288 + - - 3 + - 2038.44 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 1024 + - - 14 + - 3753.73 + - - - 4 + - 1856 + - 1 + - 128 + - 4 + - 4 + - 128 + - 1856 + - - 22 + - 16.5439 + - - - 5888 + - 6784 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 6784 + - - 4 + - 2078.06 + - - - 5056 + - 256 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 256 + - - 3 + - 983.351 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 4288 + - - 18 + - 4121.48 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 256 + - - 26 + - 40.764 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 3584 + - - 6 + - 3451.82 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 4 + - - 26 + - 124.415 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 4288 + - - 10 + - 3468.87 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 704 + - - 18 + - 3772.65 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 4288 + - - 18 + - 3925.89 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1024 + - - 17 + - 564.256 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 2944 + - - 18 + - 4067.41 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 4 + - - 26 + - 0.655768 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3584 + - - 14 + - 3859.06 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 448 + - - 12 + - 2291.16 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1856 + - - 6 + - 3497.55 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 448 + - - 6 + - 2337.78 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 2944 + - - 12 + - 1721.96 + - - - 5888 + - 2944 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 2944 + - - 3 + - 1793.74 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 
+ - 2368 + - 768 + - 1024 + - - 14 + - 3589.57 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 3584 + - - 14 + - 4256.09 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 768 + - 5888 + - - 14 + - 3117.94 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 128 + - - 19 + - 145.636 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 256 + - - 6 + - 1683.49 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3584 + - - 18 + - 3951.38 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1024 + - - 14 + - 3278.18 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 448 + - - 6 + - 2293.76 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 768 + - 256 + - - 6 + - 1487.66 + - - - 1408 + - 4288 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 4288 + - - 3 + - 1788.56 + - - - 2368 + - 4 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 4 + - - 22 + - 21.8377 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 2368 + - - 14 + - 3825.21 + - - - 3584 + - 256 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 256 + - - 2 + - 870.704 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1024 + - - 6 + - 3161.86 + - - - 1408 + - 256 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 256 + - - 2 + - 462.855 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 448 + - - 18 + - 3810.3 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1856 + - - 14 + - 3378.74 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 448 + - - 10 + - 2473.66 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 5888 + - - 25 + - 350.292 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 2368 + - - 14 + - 3857.82 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 448 + - - 14 + - 3300.17 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 256 + - 128 + - - 17 + - 52.6394 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 2368 + - - 
14 + - 4144.19 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 448 + - - 6 + - 3238.59 + - - - 2944 + - 5888 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 5888 + - - 1 + - 2121.21 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 448 + - - 6 + - 685.984 +- null diff --git a/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml new file mode 100644 index 000000000..2aee7dfa1 --- /dev/null +++ b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml @@ -0,0 +1,19239 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + 
CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + 
PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x128x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 
0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 2048 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + 
PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x128x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: 
false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + 
PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x64x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + 
BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 32 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 32 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 4 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 4 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + 
PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x32_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false 
+ AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 16 + LSPB: 16 + LVCA: 4 + LVCB: 4 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: 
+ - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x64x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + 
AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + 
PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + 
AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 64 + LVCA: 8 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 
+ OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - 
AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + 
NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 
1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 32 + LVCA: 4 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + 
NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 8 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x32x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + 
VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + 
NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 9 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + 
UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + 
MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 10 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU8_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + 
ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 
64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 11 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x128x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + 
SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + 
MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 12 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + 
StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + 
LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 13 + SolutionNameMin: 
Cijk_Alik_Bljk_SB_MT128x128x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 32 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: 
true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 
1 + ScheduleLocalWrite: 1 + SolutionIndex: 14 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 64 + LVCA: 8 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + 
LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + 
ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 15 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x64x16_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 64 + LVCA: 8 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + 
LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + 
UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 16 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x64x16_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 
1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + 
TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 17 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + 
LdsNumElements: 4096 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + 
Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 18 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 32 + LVCA: 4 
+ LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + 
SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 19 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x32x16_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + 
KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 32 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + 
NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 20 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + 
GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + 
NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 21 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: 
false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 32 + LVCA: 4 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 
2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 22 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x32x16_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: 
true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 2 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 4 + LSCB: 4 + LSPA: 16 + LSPB: 16 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + 
IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 23 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT16x16x4_SE_AMAS2_GRVW2_GSU1_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + 
GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 4 + LSCB: 4 + LSPA: 16 + LSPB: 16 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + 
- 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 24 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT16x16x4_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + 
GlobalReadVectorWidth: 2 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + 
IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 25 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + 
GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + 
IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 26 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU4_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + 
GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + 
IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 27 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU8_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + 
GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + 
Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 28 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU2_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + 
GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: 
false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 29 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + 
GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + 
HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 30 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 12 + - 2943.57 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 4030.09 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 14 + - 2175.48 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 8 + - 3058.29 + - - - 3584 + - 4288 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 2020.31 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 12 + - 2918.47 + - - 
- 4 + - 3584 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 33.0993 + - - - 5056 + - 1856 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2128.18 + - - - 3584 + - 2368 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1823.18 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 11 + - 3301.5 + - - - 128 + - 4 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 23 + - 1.26812 + - - - 64 + - 1024 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 84.223 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 2912.71 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 13 + - 3954.96 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 27 + - 67.4635 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 15 + - 1769.49 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 13 + - 3795.25 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 13 + - 3309.12 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 11 + - 3898.8 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 316.927 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 27 + - 28.1789 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 11 + - 3885.39 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2938.06 + - - - 256 + - 2368 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 570.549 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 13 + - 4257.51 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 25 + - 117.715 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 13 + - 3791.67 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 27 + - 36.0448 + - - - 64 + - 256 + - 1 + - 256 + - 64 
+ - 64 + - 256 + - 256 + - - 18 + - 126.64 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 8 + - 1840.72 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 30 + - 65.0705 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 12 + - 2925.5 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 12 + - 3041.21 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 4076.21 + - - - 2368 + - 3584 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 2093.92 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 26 + - 24.9618 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 8 + - 1583.2 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 30 + - 63.9092 + - - - 5056 + - 256 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 950.407 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 3919.67 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4014.64 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 17 + - 3871.78 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 2962.39 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 3884.3 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 28 + - 65.1178 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 8 + - 2657.68 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 12 + - 2601.64 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 12 + - 2644.21 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 8 + - 2748.88 + - - - 6784 + - 1408 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2037.19 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 
768 + - 768 + - - 13 + - 4051.46 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 11 + - 3964.71 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 1125.21 + - - - 1408 + - 4288 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1802.58 + - - - 1408 + - 3584 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1707.71 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 13 + - 4045.69 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 13 + - 3092.05 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 17 + - 3493.15 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 8 + - 3326.29 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 26 + - 40.8496 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 4134.11 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 13 + - 3655.82 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 13 + - 4280.89 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 11 + - 3407.39 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 11 + - 3507.78 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 11 + - 3446.52 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 11 + - 3706.31 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 6 + - 1127.5 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 2004.76 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 11 + - 3764.68 + - - - 5888 + - 1408 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 1861.42 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 13 + - 3881.64 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + 
- 256 + - 256 + - - 6 + - 1046.67 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 17 + - 3968.68 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 17 + - 3432.04 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 8 + - 2996.75 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3735.99 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 27 + - 193.541 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 8 + - 3111.93 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 11 + - 3682.09 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 8 + - 2610.56 + - - - 128 + - 1856 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 277.654 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 8 + - 2048.69 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 4169.73 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 3872.86 + - - - 2368 + - 1856 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 1784.32 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 13 + - 4098.87 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 3255.82 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 26 + - 67.9287 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 1292.26 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 8 + - 1898.88 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 17 + - 3480.58 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 12 + - 3009.91 + - - - 4 + - 2944 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 27.0715 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 
+ - - 12 + - 2618.13 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 17.9305 + - - - 1408 + - 2944 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1623.96 + - - - 448 + - 5888 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1622.03 + - - - 1856 + - 256 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 3 + - 531.993 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 5 + - 1602.99 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 8 + - 1670.56 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 17 + - 4025.95 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 2814.72 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 27 + - 206.72 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 8 + - 1715.31 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 18 + - 682.37 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2944.46 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 13 + - 3702.04 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 11 + - 3532.77 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 17 + - 3313.75 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 8 + - 3023.9 + - - - 128 + - 5056 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 0 + - 625.661 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4097.22 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 11 + - 3194.21 + - - - 5888 + - 1024 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 1765.54 + - - - 4 + - 4288 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 39.261 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 17 + - 3342.61 + - - - 704 
+ - 4288 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1489.36 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 12 + - 2740.23 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 12 + - 2594.05 + - - - 64 + - 64 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 5.116 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 13 + - 4012.71 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 8 + - 3246.64 + - - - 4 + - 704 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 6.40006 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 2830.09 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 91.8428 + - - - 5888 + - 2944 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2074.41 + - - - 256 + - 2944 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 4 + - 680.893 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4142.97 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 8 + - 1848.45 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 17 + - 3965.71 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 12 + - 2240.26 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 17 + - 3486.99 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 13 + - 3178.98 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 3044.44 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 3940.45 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 20 + - 2643.46 + - - - 128 + - 256 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 41.1206 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 17 + - 3247.06 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + 
- 2368 + - 256 + - 256 + - - 12 + - 3130.08 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 29 + - 94.6214 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 12 + - 3244.21 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 13 + - 4014.32 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 8 + - 1858.66 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 17 + - 3954.88 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 + - 7.8019 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 25 + - 68.3061 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 11 + - 3315.82 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 26 + - 192.543 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 17 + - 2967.67 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 18 + - 172.463 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 11 + - 3751.87 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 8 + - 2316.85 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 4137.71 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 13 + - 3712.17 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 29 + - 132.972 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 3308.8 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 17 + - 3301.03 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 483.624 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3509.71 + - - - 4288 + - 64 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 3 + - 324.772 + - - - 128 + - 4288 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 0 + - 530.624 + - - - 1856 + 
- 6784 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 11 + - 3743.18 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 30 + - 1.64498 + - - - 256 + - 704 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 215.193 + - - - 4288 + - 1856 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 1993.68 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 17 + - 3646.66 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 11 + - 3562.96 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 4401.47 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 11 + - 3923.75 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 26 + - 170.936 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 26 + - 194.298 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 2000.01 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 39.7373 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 12 + - 3355.2 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 8 + - 1718.16 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 17 + - 3307.9 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 13 + - 3933.26 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 17 + - 3591.48 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 3946.89 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 8 + - 1432.24 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3772.77 + - - - 2944 + - 64 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 3 + - 226.496 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 27 + - 4.33439 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 768 
+ - 768 + - - 6 + - 1750.78 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 348.259 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 17 + - 3814.29 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 8 + - 3277.49 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 8 + - 2535.08 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 8 + - 1200.09 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 92.084 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 8 + - 2466.36 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 11 + - 3446.52 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 11 + - 3628.42 + - - - 3584 + - 1856 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1793.87 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 13 + - 3389.72 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 17 + - 3555.34 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 785.15 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 12 + - 2117.41 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 8 + - 2898.71 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3844.44 + - - - 4288 + - 4 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 23 + - 39.487 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 12 + - 3197.32 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 11 + - 3735.71 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2156.78 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 13 + - 3923.21 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 13 + 
- 3768.93 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 27 + - 7.77019 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 1338.33 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 11 + - 3775.83 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 17 + - 3715.56 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 11 + - 3788.54 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 8 + - 1385.62 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 4089.55 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 11 + - 3546.84 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 18 + - 1869.05 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 11 + - 3590.44 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 17 + - 2813.62 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 4200.33 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3429.92 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 453.174 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 8 + - 1288.5 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 2757.93 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 13 + - 3843.19 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 3265.82 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 18 + - 221.619 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 13 + - 3866.96 + - - - 4 + - 5888 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 53.6802 + - - - 1856 + - 5056 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 2132.41 + - - - 
5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4091.25 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 25 + - 129.91 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 3174.83 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 1321.81 + - - - 1024 + - 3584 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1464.35 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 8 + - 2964.17 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 988.505 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 + - 48.0117 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 1347.95 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 11 + - 3940.81 + - - - 4288 + - 1024 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 1778.6 + - - - 1408 + - 256 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 3 + - 427.514 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3841.81 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 7 + - 2221.25 + - - - 1408 + - 6784 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 2040.18 + - - - 6784 + - 448 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 1 + - 1378.73 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 25 + - 158.538 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 3860.23 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 63.1672 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 18 + - 349.914 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 11 + - 3614.13 + - - - 1856 + - 2944 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1932.9 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + 
- 768 + - 768 + - - 5 + - 92.9589 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 477.415 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 8 + - 2880.06 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 3101.47 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 12 + - 2990.64 + - - - 1856 + - 4288 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1988.7 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 27.8877 + - - - 2368 + - 6784 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 2192.74 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 11 + - 3607.21 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 11 + - 3719.54 + - - - 2944 + - 4 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 23 + - 27.1495 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 936.229 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 17 + - 3540.88 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 27 + - 46.2452 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 11 + - 3489.34 + - - - 5888 + - 256 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 1044.49 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 2911.28 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 97.5212 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 639.376 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 12 + - 2602.85 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 534.988 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 27 + - 13.1743 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 13 + - 3359.6 + - - - 1024 + - 
1024 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 12 + - 2427.02 + - - - 2368 + - 5888 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 2166.5 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 3192.58 + - - - 1856 + - 64 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 3 + - 145.413 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 30 + - 35.0176 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 998.767 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 27 + - 20.2464 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 22 + - 2233.92 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 20 + - 2886.11 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 11 + - 3791.37 + - - - 5056 + - 1408 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 1987.81 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 4079.08 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 3323.76 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 2139.32 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 8 + - 2447.1 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2941.67 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 18 + - 756.704 + - - - 1024 + - 1408 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 937.37 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4177.95 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 12 + - 2873.17 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 8 + - 2099.84 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 11 + - 3976.61 + - - - 4288 + - 4 + - 1 + - 
768 + - 4288 + - 4288 + - 768 + - 768 + - - 26 + - 151.063 + - - - 448 + - 1024 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 515.452 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 24.2237 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 18 + - 905.838 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 22 + - 1865.77 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 8 + - 2550.54 + - - - 128 + - 1024 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 170.778 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 17 + - 3184.28 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 27 + - 38.6205 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 8 + - 2334.44 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 11 + - 3764.82 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 12 + - 3194.39 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 12 + - 2523.29 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 174.066 + - - - 1408 + - 2368 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1575.96 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 11 + - 3723.65 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 11 + - 3893.92 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 14.39 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 2778.39 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 22 + - 1923.8 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 13 + - 4049.68 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 17 + - 3303.38 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 
30 + - 18.2046 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 5 + - 720.671 + - - - 4 + - 256 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 2.35404 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 14 + - 2211.45 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 8 + - 2139.95 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 17 + - 2988.92 + - - - 704 + - 1024 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 726.344 + - - - 4288 + - 128 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 548.864 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 17 + - 3815.7 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 15 + - 1505.39 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 8 + - 2359.49 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 13 + - 3979.44 + - - - 1408 + - 1024 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1059.17 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 13 + - 3405.1 + - - - 64 + - 4 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 23 + - 0.629192 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 3422.91 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 11 + - 3285.08 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 12 + - 3203.64 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 11 + - 3495.53 + - - - 1024 + - 448 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 474.162 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 8 + - 1926.65 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 18 + - 796.874 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 1878.67 + - - 
- 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 8 + - 2248.16 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 8 + - 2559.45 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 13 + - 3923.01 + - - - 704 + - 2368 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1317.84 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 11 + - 3474.2 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 13 + - 3847.74 + - - - 4288 + - 704 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 1503.74 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 3794.06 + - - - 2944 + - 1856 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 1832.43 + - - - 1024 + - 1024 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 732.95 + - - - 2368 + - 704 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 1245.25 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 88.9917 + - - - 128 + - 704 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 117.986 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4231.37 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 8 + - 1516.22 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 3812.62 + - - - 5888 + - 6784 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2176.35 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 436.907 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 12 + - 2484.61 + - - - 64 + - 4288 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 319.107 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 8 + - 1971.66 + - - - 64 + - 128 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 10.1922 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 
2944 + - 1792 + - 1792 + - - 17 + - 4037.68 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 25 + - 63.0823 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 11 + - 4012.7 + - - - 4 + - 6784 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 62.1144 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 956.291 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 8 + - 2949.99 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 8 + - 1433.6 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 13 + - 4359.14 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 8 + - 2980.96 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 11 + - 3775.0 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 18 + - 128.188 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 8 + - 2585.42 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 17 + - 3962.38 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 6 + - 1908.51 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 17 + - 3907.43 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 11 + - 3816.24 + - - - 1024 + - 4 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 23 + - 9.72353 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 17 + - 3438.44 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 14 + - 2213.28 + - - - 64 + - 1856 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 151.801 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 1336.09 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 11 + - 3415.04 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 
12 + - 2138.05 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 6 + - 2501.83 + - - - 64 + - 256 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 20.5281 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 2047.74 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 12 + - 2954.17 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 12 + - 1473.34 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 13 + - 3179.73 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 17 + - 3366.06 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 11 + - 3922.94 + - - - 4288 + - 448 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 2 + - 1388.9 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 17 + - 3823.0 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 257.635 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 29 + - 32.3662 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 17 + - 3366.39 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 11 + - 3894.22 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 17 + - 2788.62 + - - - 128 + - 2368 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 354.249 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 29 + - 39.8297 + - - - 3584 + - 5888 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 2092.35 + - - - 3584 + - 1024 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1506.42 + - - - 4288 + - 3584 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2219.44 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 13 + - 3422.66 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 11 + - 3504.78 + - - - 5056 + - 
1024 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 12 + - 3272.27 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 773.857 + - - - 6784 + - 2944 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2134.34 + - - - 448 + - 4288 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1477.0 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 2538.1 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 8 + - 2831.43 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 27 + - 103.448 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 3506.5 + - - - 3584 + - 4 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 24 + - 33.0516 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 17 + - 3872.85 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 4317.51 + - - - 704 + - 128 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 3 + - 113.259 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 1675.81 + - - - 5056 + - 64 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 3 + - 370.339 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 1603.9 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 3409.54 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 2353.89 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 13 + - 4126.96 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 18 + - 1128.08 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 13 + - 3151.21 + - - - 4 + - 448 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 4.1554 + - - - 1024 + - 2368 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1177.11 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + 
- 768 + - 768 + - - 12 + - 2744.0 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 18 + - 1240.45 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 3988.18 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 18 + - 592.575 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 936.229 + - - - 448 + - 256 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 147.746 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 11 + - 3927.59 + - - - 6784 + - 2368 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2118.63 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 12 + - 3197.0 + - - - 2944 + - 6784 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 2145.67 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 2131.79 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3928.5 + - - - 5056 + - 5056 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2232.84 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 11 + - 3779.49 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 29 + - 1.76172 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 11 + - 3660.47 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 6 + - 3046.49 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 4119.06 + - - - 4288 + - 1408 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 1881.58 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 4146.25 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 17 + - 4030.37 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 637.961 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + 
- - 13 + - 3358.39 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 6 + - 1541.43 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 13 + - 3460.48 + - - - 2944 + - 3584 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 2036.93 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4262.56 + - - - 704 + - 1856 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1031.38 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 57.201 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 1052.4 + - - - 704 + - 5888 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1701.45 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 2590.4 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 21 + - 922.536 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 12 + - 3301.59 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 4100.33 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 17 + - 3623.32 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 3778.27 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 4039.82 + - - - 448 + - 1856 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 845.223 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 17 + - 3951.52 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 8 + - 2876.39 + - - - 5056 + - 448 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 1379.57 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 3059.56 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 12 + - 2929.52 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 11 + - 
3978.03 + - - - 2944 + - 2368 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 1856.26 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 6 + - 1880.06 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 17 + - 3227.24 + - - - 256 + - 5056 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 803.0 + - - - 6784 + - 256 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 1285.85 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 12 + - 2663.18 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 12 + - 2805.43 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 17 + - 3942.17 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3272.93 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 11 + - 4032.36 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 13 + - 4245.62 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 900.182 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 782.117 + - - - 2368 + - 128 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 3 + - 360.57 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 17 + - 3643.87 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 25 + - 100.828 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 17 + - 3329.81 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4150.24 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 8 + - 2301.61 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 2902.84 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 13 + - 3375.57 + - - - 1024 + - 2944 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1258.73 + - - 
- 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 11 + - 3896.4 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4002.09 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 11 + - 3305.3 + - - - 4288 + - 2368 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2116.79 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 8 + - 2392.71 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 25 + - 107.984 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 30 + - 0.463648 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 13 + - 3959.24 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 8 + - 1194.5 + - - - 704 + - 4 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 23 + - 6.76523 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 1303.98 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 13 + - 3785.45 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 707.256 + - - - 64 + - 6784 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 486.472 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 11 + - 4023.13 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 30 + - 0.0973384 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 18 + - 1563.73 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 17 + - 3709.14 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 13 + - 3932.49 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 3976.21 + - - - 1024 + - 704 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 685.751 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 12 + - 3279.23 + - - - 2368 + - 448 + - 1 + - 3328 + - 
2368 + - 2368 + - 3328 + - 3328 + - - 6 + - 2655.51 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 18 + - 636.553 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 8 + - 1178.18 + - - - 5888 + - 3584 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2070.91 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 11 + - 3941.22 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 8 + - 2747.77 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 8 + - 3155.77 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 27 + - 194.818 + - - - 128 + - 2944 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 413.533 + - - - 5888 + - 704 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 1568.28 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 8 + - 1116.96 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 66.7989 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 8 + - 1534.5 + - - - 3584 + - 5056 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 2067.54 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 13 + - 4078.28 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 2892.62 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 12 + - 2911.61 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 12 + - 2938.1 + - - - 3584 + - 3584 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 2006.85 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 14 + - 2163.91 + - - - 4 + - 1024 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 9.60947 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 12 + - 2134.27 + - - - 6784 + - 1856 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + 
- - 0 + - 2043.18 + - - - 704 + - 64 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 3 + - 56.4523 + - - - 2944 + - 448 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 984.263 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 8 + - 1602.52 + - - - 448 + - 1408 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 635.951 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 12 + - 2528.87 + - - - 704 + - 448 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 3 + - 379.134 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 17 + - 4081.74 + - - - 6784 + - 5888 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2254.19 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 8 + - 2082.79 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 17 + - 3376.66 + - - - 5056 + - 4 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 23 + - 46.2267 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 12 + - 2936.01 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 11 + - 3427.0 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 12 + - 3138.2 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 17 + - 3209.72 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 8 + - 2207.19 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4363.07 + - - - 2368 + - 4 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 23 + - 21.8692 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 12 + - 2882.31 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 11 + - 3292.77 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 3176.36 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 3334.09 + - - 
- 64 + - 3584 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 264.41 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 11 + - 2654.62 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 11 + - 3424.87 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 1248.3 + - - - 6784 + - 5056 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2197.39 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 6 + - 1508.6 + - - - 4288 + - 2944 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2219.83 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 27 + - 174.198 + - - - 2944 + - 5056 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 2086.36 + - - - 1024 + - 1856 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1165.53 + - - - 5056 + - 4288 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2220.47 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 11 + - 3805.55 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 17 + - 3504.4 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 2501.25 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 13 + - 4079.5 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 1035.4 + - - - 64 + - 2368 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 187.681 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 2087.01 + - - - 448 + - 64 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 36.2363 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 12 + - 3319.94 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 30 + - 166.672 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 12 + - 3134.62 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 
+ - 256 + - 256 + - - 17 + - 3705.41 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 703.742 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 4105.95 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 8 + - 2001.32 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3694.22 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 13 + - 3515.8 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 8 + - 2428.63 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 42.7874 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 17 + - 3699.64 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 6 + - 1845.71 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 1135.42 + - - - 4288 + - 5888 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2285.9 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 17 + - 3528.76 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 13 + - 3408.24 + - - - 4 + - 1856 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 17.1407 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 4169.2 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 12 + - 3040.19 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3033.54 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 2046.41 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 866.011 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 11 + - 3986.03 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 6 + - 2076.01 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 8 + - 1464.6 + 
- - - 2944 + - 5888 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 2157.85 + - - - 4 + - 5056 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 46.2928 + - - - 2944 + - 1408 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 1610.94 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 13 + - 3343.39 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 25 + - 102.591 + - - - 1408 + - 448 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 4 + - 609.453 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 17 + - 3811.33 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 17 + - 3560.04 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 29 + - 147.149 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 4089.07 + - - - 1024 + - 128 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 3 + - 162.444 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 64.9543 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 20.0746 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 30 + - 64.8543 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 4245.76 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 11 + - 3497.0 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 18 + - 1692.55 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 12 + - 2641.1 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 4127.14 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 6 + - 1345.83 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 13 + - 3628.73 + - - - 704 + - 5056 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1729.98 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 
448 + - 3328 + - 3328 + - - 16 + - 1548.03 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 26 + - 165.235 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 11 + - 3772.45 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 4027.52 + - - - 64 + - 2944 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 225.648 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 2436.81 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 30 + - 80.5842 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 302.807 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4244.08 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 8 + - 2586.04 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3858.79 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 8 + - 3099.6 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 11 + - 3842.95 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4051.83 + - - - 128 + - 3584 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 489.662 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 3726.34 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 13 + - 3848.18 + - - - 5888 + - 5056 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2161.14 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 12 + - 3256.34 + - - - 1408 + - 5056 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1867.24 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 13 + - 4198.68 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 13 + - 4150.84 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 768 
+ - 768 + - - 12 + - 2925.96 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 27 + - 10.768 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 18 + - 471.688 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4204.34 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 22 + - 2244.06 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 11 + - 3807.9 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 3861.29 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 29 + - 73.8776 + - - - 3584 + - 6784 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 2122.21 + - - - 256 + - 1024 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 305.707 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 17 + - 4023.15 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 8 + - 2922.98 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 12 + - 2979.77 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 17 + - 3500.51 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 13 + - 4355.2 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 18 + - 1551.09 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 12 + - 3211.89 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 11 + - 3683.98 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 13 + - 3399.64 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 12 + - 2992.47 + - - - 3584 + - 256 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 4 + - 858.483 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 3862.76 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + 
- 133.433 + - - - 448 + - 4 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 23 + - 4.40434 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 4388.11 + - - - 4 + - 4 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 0.0353594 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4005.99 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 10 + - 258.172 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 7.7179 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 17 + - 3703.86 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 8 + - 1890.69 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3632.51 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 13 + - 3559.59 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 171.898 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 20 + - 2258.95 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 11 + - 3321.78 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 13 + - 3770.87 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 13 + - 3972.92 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 12 + - 2693.84 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 12 + - 3462.63 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 224.878 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 13 + - 3970.57 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 11 + - 3516.93 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 8 + - 2341.62 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 17 + - 3871.12 + - - - 448 + 
- 4 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 27 + - 24.7885 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 3240.48 + - - - 6784 + - 64 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 3 + - 503.392 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 17 + - 3087.43 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 4030.55 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 17 + - 3615.11 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 18 + - 488.847 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 11 + - 3222.09 + - - - 5056 + - 2368 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2110.41 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 4164.62 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3196.19 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 13 + - 3616.52 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 22 + - 1780.41 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 692.657 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 27 + - 131.477 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 3736.59 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 8 + - 2997.81 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 12 + - 2598.84 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 8 + - 1267.22 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 25 + - 78.2549 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 8 + - 1704.74 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 17 + - 3567.28 + - - - 64 + - 448 + - 1 + - 
128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 38.3893 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 3800.43 + - - - 2944 + - 4288 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 2033.86 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 4027.08 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 1028.02 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 8 + - 1960.23 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 8 + - 1833.49 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 12 + - 3270.14 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 11 + - 3992.16 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 1121.04 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 13 + - 4068.92 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 8 + - 1838.74 + - - - 256 + - 256 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 81.984 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 20 + - 2415.76 + - - - 6784 + - 4288 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2209.21 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 8 + - 2469.08 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 17 + - 3599.03 + - - - 1024 + - 4288 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1517.71 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 18 + - 1286.44 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 67.1761 + - - - 6784 + - 704 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 1665.91 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 3363.58 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 
768 + - 768 + - - 6 + - 1056.5 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 27 + - 179.123 + - - - 1024 + - 64 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 3 + - 82.7605 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 8 + - 2947.22 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 30 + - 48.0117 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 2007.04 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 2036.07 + - - - 2368 + - 2368 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 1979.68 + - - - 1024 + - 5056 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1562.97 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 11 + - 3902.17 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 3292.32 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 496.955 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 2266.62 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 8 + - 1658.51 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 11 + - 3833.44 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 12 + - 3350.97 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 6 + - 3223.71 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 12 + - 2382.06 + - - - 4288 + - 6784 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2287.61 + - - - 256 + - 1856 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 505.464 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 16 + - 1030.35 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 1943.6 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 
3098.83 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 + - 4.28153 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 11 + - 3874.66 + - - - 1856 + - 1856 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1674.75 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 1396.75 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 11 + - 3691.32 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 11 + - 3302.66 + - - - 3584 + - 2944 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1945.39 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3866.25 + - - - 1024 + - 6784 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1645.92 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 13 + - 3826.91 + - - - 64 + - 704 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 55.0723 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 6 + - 2545.27 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 1425.17 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 11 + - 3861.69 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 15 + - 1807.68 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 46.0859 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 8 + - 2019.27 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 11 + - 3540.4 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 13 + - 3904.76 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3497.09 + - - - 2944 + - 256 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 755.553 + - - - 704 + - 6784 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1932.6 + - - - 1856 + - 6784 + - 1 + - 1792 
+ - 1856 + - 1856 + - 1792 + - 1792 + - - 11 + - 4008.71 + - - - 5888 + - 5888 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2192.74 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 13 + - 4142.02 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 1965.2 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 13 + - 3857.27 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 1638.4 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 3348.03 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 11 + - 3878.66 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 19 + - 1519.92 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 1057.77 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 19 + - 1518.57 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 15 + - 2147.66 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 3354.98 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 12 + - 2845.11 + - - - 4288 + - 256 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 834.774 + - - - 2368 + - 1408 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 1625.92 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 27 + - 64.6553 + - - - 704 + - 704 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 486.494 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 28 + - 86.9278 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 30 + - 5.67903 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 13 + - 4203.84 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 2165.03 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 
+ - - 13 + - 4348.15 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 6 + - 2425.53 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 27 + - 134.927 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 3341.36 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 18 + - 256.376 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 12 + - 2614.82 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 17 + - 3119.18 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 26 + - 183.373 + - - - 2944 + - 128 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 3 + - 451.972 + - - - 4288 + - 5056 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2224.03 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 17 + - 3708.87 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 13 + - 4156.02 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 17 + - 3250.3 + - - - 1408 + - 5888 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1957.86 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 11 + - 3867.95 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 745.559 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 2897.86 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 17 + - 3982.55 + - - - 448 + - 6784 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1508.3 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 3051.36 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 12 + - 2684.81 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 2903.45 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 1737.05 
+ - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 18 + - 682.37 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 11 + - 3188.42 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 18 + - 1261.17 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4050.28 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 11 + - 3420.66 + - - - 4 + - 1408 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 12.4122 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 1358.45 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 3646.2 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 8 + - 2643.9 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 1433.6 + - - - 5888 + - 448 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 2 + - 1265.9 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 12 + - 3044.65 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 11 + - 3808.28 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 2378.22 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 3981.55 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 22 + - 2396.49 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 8 + - 2102.95 + - - - 448 + - 3584 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1277.48 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 7 + - 2826.19 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 6 + - 2384.26 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 17 + - 3302.6 + - - - 256 + - 3584 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 774.674 + - - - 6784 + - 4 + - 1 + - 3328 + - 
6784 + - 6784 + - 3328 + - 3328 + - - 26 + - 66.9749 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 2691.66 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 11 + - 3638.34 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 11 + - 3490.16 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 17 + - 3438.97 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2674.6 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 13 + - 3831.25 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 12 + - 3338.3 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 711.084 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 4391.67 + - - - 4288 + - 4288 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2232.95 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 8 + - 1757.12 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 146.777 + - - - 2368 + - 4288 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 2101.73 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 30 + - 70.3341 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 12 + - 3158.95 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 2648.0 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 126.334 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 2816.69 + - - - 5888 + - 64 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 3 + - 449.278 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 8 + - 1680.12 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 11 + - 3788.44 + - - - 5888 + - 1856 + - 1 + - 128 + - 5888 + - 5888 + - 128 
+ - 128 + - - 0 + - 1951.45 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 18 + - 629.604 + - - - 3584 + - 128 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 3 + - 506.558 + - - - 5056 + - 128 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 650.42 + - - - 2944 + - 2944 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 2027.7 + - - - 1856 + - 1408 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1610.01 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 8 + - 1534.39 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 17 + - 3655.81 + - - - 2368 + - 256 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 608.872 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 17 + - 3941.92 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 63.3198 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 22 + - 1777.04 + - - - 1856 + - 6784 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 2231.48 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 30 + - 80.7835 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 13 + - 3949.4 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 6 + - 2472.18 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 13 + - 4056.65 + - - - 1856 + - 448 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 814.685 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 11 + - 3735.52 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 8 + - 1681.82 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 4266.96 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 13 + - 3813.49 + - - - 1408 + - 4 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 23 + - 13.213 + - 
- - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 3308.43 + - - - 5056 + - 3584 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2238.34 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 11 + - 3751.09 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 11 + - 3156.68 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 6 + - 1076.66 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 27.7695 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 8 + - 2183.71 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 3981.7 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 11 + - 2973.77 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 11 + - 3721.45 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 17 + - 3106.56 + - - - 256 + - 448 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 146.449 + - - - 128 + - 6784 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 0 + - 773.157 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3759.52 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 27 + - 167.95 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 17 + - 3745.47 + - - - 5056 + - 2944 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2170.2 + - - - 2368 + - 448 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 844.469 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 12 + - 2113.69 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 18 + - 303.14 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 17 + - 3129.61 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 30 + - 205.209 + - - - 2368 + - 5056 + - 1 + - 128 + - 2368 + - 
2368 + - 128 + - 128 + - - 0 + - 2121.4 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 2471.5 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 9 + - 2525.06 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 13 + - 4106.76 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 20 + - 1995.87 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 8 + - 3007.74 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 27 + - 9.30909 + - - - 5888 + - 2368 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2023.26 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 12 + - 3174.08 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 + - 14.9171 + - - - 1856 + - 1024 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1435.05 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 17 + - 3869.61 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 2933.5 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 20 + - 2101.52 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2379.93 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 8 + - 2393.26 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 5 + - 967.458 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 13 + - 4033.91 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 12 + - 2641.32 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 18 + - 766.984 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 12 + - 2918.81 + - - - 5056 + - 6784 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 1 + - 2324.24 + - - - 1856 + - 128 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 3 + - 
286.011 + - - - 256 + - 64 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 20.7228 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 12 + - 2854.86 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 1786.25 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 11 + - 3917.33 + - - - 64 + - 1408 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 117.505 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 17 + - 3590.65 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 29 + - 3.25726 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 13 + - 3886.13 + - - - 448 + - 128 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 70.6316 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 6 + - 1149.45 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 18 + - 351.871 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 165.914 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 8 + - 2400.07 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 10.5861 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 2819.15 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 11 + - 3776.06 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 3796.29 + - - - 5056 + - 1024 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 1847.4 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 4118.83 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 11 + - 3281.29 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 16 + - 1638.94 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 13 + - 3547.47 + - - - 5056 + - 2944 + - 1 + - 
256 + - 5056 + - 5056 + - 256 + - 256 + - - 13 + - 3719.76 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 26 + - 212.438 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 1942.87 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 12 + - 2875.17 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 12 + - 2476.1 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 17 + - 3432.86 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3954.77 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 1905.19 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 17 + - 2644.44 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 17 + - 3882.47 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 13 + - 4244.5 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 1398.46 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 27 + - 9.40066 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 6 + - 1887.82 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 82.2777 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 8 + - 2746.92 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 8 + - 1427.52 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 17 + - 3481.2 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 456.513 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 8 + - 2289.42 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 26 + - 205.978 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 17 + - 4021.59 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - 
- 10 + - 139.438 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 12 + - 2577.71 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 18 + - 344.103 + - - - 3584 + - 448 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1121.35 + - - - 1856 + - 704 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1018.31 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 2590.6 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 27 + - 95.7072 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4135.36 + - - - 4 + - 64 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 0.571274 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 8 + - 2503.51 + - - - 704 + - 3584 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1544.97 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 2902.6 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 47.7607 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 12 + - 3441.89 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 11 + - 3956.37 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 1021.51 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 3095.87 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 18 + - 171.336 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 11 + - 3707.07 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4001.41 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 17 + - 3788.23 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 11 + - 3830.18 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 30 + - 119.503 + - - - 128 + - 256 + - 1 + - 
1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 517.998 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4108.88 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 11 + - 3783.06 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 27 + - 13.7786 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 1627.34 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 11 + - 3396.28 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 3228.52 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 29 + - 49.9777 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 436.068 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 12 + - 3324.06 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 8 + - 3001.42 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 13 + - 3816.46 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 18 + - 917.365 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 3941.26 + - - - 704 + - 1408 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 818.777 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 12 + - 3009.58 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 17 + - 3860.72 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 29 + - 31.5077 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 17 + - 4031.31 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 26 + - 113.732 + - - - 1856 + - 3584 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 2014.59 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 1108.19 + - - - 2368 + - 2944 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + 
- - 0 + - 1952.09 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 17 + - 3910.92 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 1845.07 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 7 + - 2448.55 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 12 + - 3341.42 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4142.27 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 3137.4 + - - - 448 + - 448 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 244.388 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 30 + - 5.82025 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 8 + - 2710.22 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 13 + - 3512.42 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 80.0529 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 12 + - 2234.56 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 466.076 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 26 + - 58.8144 + - - - 64 + - 5888 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 416.965 + - - - 1408 + - 1408 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1181.8 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 8 + - 2720.64 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 17 + - 4055.35 + - - - 3584 + - 64 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 3 + - 271.25 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 8 + - 2899.21 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 8 + - 2771.47 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 18 + - 1191.56 + - - - 448 + - 
64 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 715.94 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 172.14 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 4358.37 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 8 + - 3103.29 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 12 + - 2944.55 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 8 + - 1622.27 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 12 + - 2914.06 + - - - 3584 + - 1408 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1567.47 + - - - 1856 + - 4 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 23 + - 17.0914 + - - - 4 + - 128 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 1.15381 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 10 + - 273.067 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 30 + - 68.6962 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 1509.17 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 17 + - 3943.29 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 + - 79.8101 + - - - 256 + - 4 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 23 + - 2.54018 + - - - 6784 + - 1024 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 1865.86 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 22 + - 2028.93 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 6 + - 2936.92 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 11 + - 3080.95 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 12 + - 2866.32 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 18 + - 752.052 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 768 
+ - 768 + - - 13 + - 4067.72 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 17 + - 3547.2 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 4149.76 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 97.0557 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 4013.96 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 17 + - 3845.39 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 8 + - 2299.34 + - - - 1408 + - 1856 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1554.93 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 11 + - 3492.96 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 4235.92 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 29 + - 3.25726 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 17 + - 3220.1 + - - - 704 + - 2944 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1285.32 + - - - 1024 + - 256 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 3 + - 303.276 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 17 + - 3770.72 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 11 + - 3517.65 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 18 + - 480.998 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 13 + - 3782.09 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 8 + - 2456.63 + - - - 128 + - 448 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 70.7951 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 12 + - 2414.18 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 120.494 + - - - 2368 + - 1024 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 1491.06 
+ - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 8 + - 1757.37 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 12 + - 2475.26 + - - - 2944 + - 704 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 1238.75 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 12 + - 3001.04 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 8 + - 3075.92 + - - - 5888 + - 4288 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2107.82 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 13 + - 3953.88 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 8 + - 2864.0 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 69.9434 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3843.46 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 28 + - 100.041 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 18 + - 1409.82 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 8 + - 2708.35 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 2683.31 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 27 + - 15.2409 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 11 + - 2821.54 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 8 + - 2659.43 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 13 + - 3926.72 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 27 + - 124.17 + - - - 448 + - 2944 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1033.93 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 8 + - 1704.94 + - - - 6784 + - 128 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 4 + - 771.012 + - - - 1024 + - 1856 + - 1 + - 3328 + - 
1024 + - 1024 + - 3328 + - 3328 + - - 17 + - 3913.99 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 27 + - 152.287 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 773.857 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 3955.21 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 13 + - 3754.09 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 8 + - 1531.7 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 12 + - 3329.06 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 11 + - 3550.12 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 6 + - 2693.14 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 11 + - 3347.13 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 13 + - 3728.09 + - - - 2944 + - 1024 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 1428.33 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 17 + - 3218.47 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 13 + - 3339.02 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 27 + - 14.4808 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 6 + - 2227.37 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 16 + - 1406.1 + - - - 256 + - 128 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 40.5796 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 12 + - 3175.6 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 13 + - 3560.83 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 18 + - 909.648 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 8 + - 3011.61 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + 
- 5888 + - 256 + - 256 + - - 17 + - 3932.12 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 3873.56 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 12 + - 2982.83 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 803.821 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 17 + - 3745.13 + - - - 1856 + - 5888 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 2112.74 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 8 + - 2000.01 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 30 + - 0.255574 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 3201.1 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 29 + - 65.3711 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 0.646846 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 8 + - 2297.68 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 318.855 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 8 + - 2095.88 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 18 + - 1144.91 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 1784.55 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 8 + - 1028.02 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 11 + - 3796.07 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 8 + - 2121.58 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 17 + - 3622.0 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 12 + - 2469.34 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 6 + - 2857.36 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 11 + - 
3337.89 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 14 + - 1916.79 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 13 + - 3429.41 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 17 + - 4037.31 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 3163.48 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 13 + - 3922.22 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 29 + - 180.735 + - - - 2368 + - 64 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 3 + - 183.006 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 5 + - 88.8624 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 3927.6 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 17 + - 3437.32 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 14 + - 2652.88 + - - - 256 + - 6784 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 1206.57 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 8 + - 2166.22 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 22 + - 1771.58 + - - - 128 + - 1408 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 217.958 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 17 + - 3883.9 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 13 + - 4110.25 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 12 + - 3259.36 + - - - 6784 + - 6784 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2246.59 + - - - 448 + - 5056 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1412.92 + - - - 448 + - 2368 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 809.434 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 11 + - 3964.27 + - - - 2944 + - 3584 + 
- 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 13 + - 4013.88 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 13 + - 3986.16 + - - - 1408 + - 704 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 756.666 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 11 + - 3931.66 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 13 + - 3817.3 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 1057.39 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 12 + - 2968.67 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 + - 24.3327 + - - - 128 + - 64 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 10.3943 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 6 + - 886.593 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3957.45 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 682.37 + - - - 256 + - 1408 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 404.146 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 20 + - 2361.69 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 13 + - 3163.07 + - - - 256 + - 4288 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 796.176 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 4355.54 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 18 + - 594.495 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 13 + - 4118.95 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 11 + - 3112.92 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 3971.76 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 17 + - 3921.25 + - - - 5888 + - 128 + - 1 + - 128 + - 5888 + - 5888 + - 
128 + - 128 + - - 4 + - 690.247 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 17 + - 3870.2 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 27 + - 83.9463 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 650.293 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 1125.77 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 22 + - 1301.34 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 12 + - 2461.23 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 12 + - 2887.0 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 4132.33 + - - - 1408 + - 128 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 3 + - 226.697 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 2991.75 + - - - 5056 + - 704 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 1713.84 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 11 + - 3235.36 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 3907.02 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 27 + - 7.81431 + - - - 6784 + - 4 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 23 + - 62.2034 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4333.83 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 12 + - 3420.8 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 8 + - 2476.98 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 17 + - 3822.88 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 8 + - 1613.19 + - - - 5056 + - 5888 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2267.63 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + 
- 304.481 + - - - 1408 + - 64 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 3 + - 112.905 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 27 + - 66.7496 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 12 + - 3278.42 + - - - 4 + - 2368 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 21.7437 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 18 + - 440.05 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 13 + - 3237.94 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 18 + - 1895.95 + - - - 256 + - 5888 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 1061.5 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 17 + - 3734.33 + - - - 3584 + - 704 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1237.59 + - - - 448 + - 704 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 373.521 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 11 + - 3513.81 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 18 + - 1300.77 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 92.1515 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 13 + - 3993.0 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 3596.05 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 17 + - 3516.59 + - - - 128 + - 5888 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 0 + - 671.416 + - - - 64 + - 5056 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 373.815 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 3490.96 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 17 + - 3731.32 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 17 + - 4048.09 + - - - 704 + - 3584 + 
- 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 11 + - 3101.42 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 12 + - 2640.87 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 6 + - 1731.14 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 8 + - 1963.24 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 12 + - 2165.03 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 13 + - 3985.49 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 13 + - 4105.76 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 12 + - 3216.64 + - - - 128 + - 128 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 20.7228 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4246.74 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 20 + - 2385.51 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 4157.67 + - - - 1024 + - 5888 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1585.36 + - - - 1856 + - 2368 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1808.65 + - - - 6784 + - 3584 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2193.65 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 14 + - 2683.72 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 18 + - 1248.08 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 11 + - 3500.0 + - - - 704 + - 256 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 3 + - 225.104 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 6 + - 1426.34 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 17 + - 3388.3 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 30 + - 91.8422 + - - - 5888 + - 4 + - 1 + - 128 + - 
5888 + - 5888 + - 128 + - 128 + - - 23 + - 54.143 +- null diff --git a/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml new file mode 100644 index 000000000..749a4c02c --- /dev/null +++ b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml @@ -0,0 +1,19425 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + 
FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 128 + LSCB: 64 + LSPA: 2 + LSPB: 4 + LVCA: 128 + LVCB: 64 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 1536 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + 
DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + 
GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 64 + LSCB: 64 + LSPA: 4 + LSPB: 4 + LVCA: 64 + LVCB: 64 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 1024 + LdsOffsetA: 0 + LdsOffsetB: 512 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + 
HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x8_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + 
GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 64 + LSPA: 8 + LSPB: 4 + LVCA: 8 + LVCB: 16 + LVPA: 2 + LVPB: 1 + LdcEqualsLdd: true + LdsNumElements: 1792 + LdsNumElementsAlignedA: 256 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 256 + LdsOffsetB_Blk: 1280 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: 
false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x64x8_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: 
ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 32 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 32 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 4 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 4 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + 
ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x32x32_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: 
true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + 
ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + 
DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 64 + LSPA: 8 + LSPB: 4 + LVCA: 32 + LVCB: 64 + LVPA: 8 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 4 + NumLoadsB: 8 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 8 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: 
true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x64x32_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + 
DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 4 + LSPB: 8 + LVCA: 64 + LVCB: 32 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 8 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 8 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + 
PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x32x32_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + 
CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 8 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: 
-1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x64x32_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: 
true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 64 + LSPA: 2 + LSPB: 4 + LVCA: 128 + LVCB: 64 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + 
PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 8 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + 
AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 4 + LSPB: 4 + LVCA: 64 + LVCB: 64 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + 
PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 9 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + 
AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 128 + LSPA: 16 + LSPB: 8 + LVCA: 16 + LVCB: 32 + LVPA: 4 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + 
- I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 10 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x128x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + 
AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 128 + LSPA: 4 + LSPB: 2 + LVCA: 64 + LVCB: 128 + LVPA: 4 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + 
PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 11 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - 
AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + 
PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 12 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU8_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + 
AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 128 + LSPA: 4 + LSPB: 2 + LVCA: 64 + LVCB: 128 + LVPA: 4 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + 
NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 13 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU2_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + 
WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 
256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 14 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + 
_staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 8 + LSPB: 8 + LVCA: 32 + LVCB: 32 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 256 + LdsNumElementsAlignedB: 256 + LdsOffsetA: 0 + LdsOffsetA_Blk: 512 + LdsOffsetB: 256 + LdsOffsetB_Blk: 768 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 
1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 15 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x32x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + 
WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 4 + LSPB: 8 + LVCA: 64 + LVCB: 32 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 8 + 
NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 8 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 16 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x32x32_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + 
VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 64 + LSPA: 8 + LSPB: 16 + LVCA: 32 + LVCB: 16 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 2048 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 
1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 17 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 
4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + 
NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 18 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + 
UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 64 + LSPA: 8 + LSPB: 4 + LVCA: 32 + LVCB: 64 + LVPA: 8 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + 
NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 4 + NumLoadsB: 8 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 8 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 19 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT32x64x32_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + 
ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 128 + LSPA: 8 + LSPB: 8 + LVCA: 32 + LVCB: 32 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + 
MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 20 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x128x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + 
SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 64 + LSPA: 2 + LSPB: 4 + LVCA: 128 + LVCB: 64 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + 
MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 21 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + 
StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 64 + LSPA: 2 + LSPB: 4 + LVCA: 128 + LVCB: 64 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + 
LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 22 + SolutionNameMin: 
Cijk_Ailk_Bjlk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU2_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 128 + LSPA: 4 + LSPB: 2 + LVCA: 64 + LVCB: 128 + LVPA: 4 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: 
true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 
+ ScheduleLocalWrite: 1 + SolutionIndex: 23 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 2 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 4 + LSPB: 4 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + 
LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: 
false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 24 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT16x16x4_SE_AMAS2_GRVW2_GSU1_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 4 + LSPB: 4 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + 
LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] 
+ ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 25 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT16x16x4_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + 
LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: 
false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 26 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + 
LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true 
+ UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 27 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU4_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + 
LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true 
+ UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 28 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU8_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + 
LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: 
false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 29 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU2_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + 
LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 
+ TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 30 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + 
LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false 
+ TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 31 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 5056 + - - 7 + - 3113.52 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1408 + - - 18 + - 3973.05 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 2944 + - - 4 + - 3266.22 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 256 + - - 7 + - 3329.42 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 128 + - 64 + - - 15 + - 53.3898 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 704 + - - 20 + - 4018.68 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1856 + - - 10 + - 4102.71 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 448 + - 6784 + - - 7 + - 3621.28 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 448 + - - 4 + - 3861.05 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1024 + - - 20 + - 2908.32 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 128 + - - 18 + - 3238.61 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1024 + - - 20 + - 3388.28 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 256 + - - 18 + - 3394.98 + - 
- - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 448 + - - 7 + - 3183.0 + - - - 4 + - 448 + - 1 + - 128 + - 4 + - 4 + - 4 + - 448 + - - 25 + - 4.11367 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 4288 + - - 9 + - 3031.84 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 128 + - - 7 + - 1951.19 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 6784 + - - 10 + - 4231.82 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1408 + - - 19 + - 1456.36 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 4 + - 6784 + - - 26 + - 205.608 + - - - 4288 + - 4 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 4 + - - 25 + - 38.9822 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 5056 + - - 17 + - 4222.14 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 704 + - 1408 + - - 7 + - 2826.2 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 4288 + - - 17 + - 4371.52 + - - - 2368 + - 6784 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 6784 + - - 0 + - 2500.56 + - - - 1024 + - 5888 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 5888 + - - 1 + - 2114.62 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 6784 + - - 18 + - 3082.34 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 448 + - - 18 + - 3636.87 + - - - 5056 + - 128 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 3 + - 876.031 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 128 + - - 7 + - 2456.41 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1408 + - - 27 + - 24.756 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1856 + - - 15 + - 1281.99 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 4288 + - - 17 + - 4139.4 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 1856 + - - 18 + - 3944.73 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 64 + - 64 + - - 14 + - 42.2813 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 
4 + - - 28 + - 0.483019 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 6784 + - - 10 + - 4138.18 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1024 + - - 4 + - 3184.4 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 256 + - - 4 + - 3449.9 + - - - 3584 + - 2944 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 2944 + - - 0 + - 2406.23 + - - - 5888 + - 448 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 448 + - - 0 + - 1716.36 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 1024 + - - 8 + - 3623.83 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1856 + - - 18 + - 4018.68 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 1856 + - - 18 + - 3399.06 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 704 + - - 4 + - 2698.09 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 2944 + - - 20 + - 4214.12 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1856 + - - 4 + - 3998.14 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 4 + - - 30 + - 258.72 + - - - 2944 + - 3584 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 3584 + - - 0 + - 2416.56 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 6784 + - - 17 + - 4430.11 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 4 + - 1024 + - - 28 + - 47.7784 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1856 + - - 18 + - 3703.11 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 5888 + - - 27 + - 371.686 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 5056 + - - 18 + - 3887.2 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 3584 + - - 10 + - 4042.43 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 128 + - - 14 + - 1500.06 + - - - 1856 + - 1408 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 1408 + - - 0 + - 1681.22 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 128 + 
- - 7 + - 1747.63 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 1408 + - - 18 + - 3771.23 + - - - 1408 + - 5888 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 5888 + - - 1 + - 2287.38 + - - - 448 + - 4 + - 1 + - 128 + - 448 + - 448 + - 448 + - 4 + - - 25 + - 4.26037 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 2368 + - - 10 + - 3980.93 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 64 + - - 7 + - 830.207 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1856 + - - 10 + - 4012.71 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 1408 + - - 18 + - 4020.65 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 3584 + - - 7 + - 2445.51 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 704 + - - 6 + - 1106.03 + - - - 1024 + - 1024 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 1024 + - - 1 + - 974.287 + - - - 1856 + - 2368 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 2368 + - - 1 + - 2019.54 + - - - 3584 + - 256 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 256 + - - 1 + - 1053.85 + - - - 4288 + - 1024 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 1024 + - - 0 + - 1930.07 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 4 + - 2944 + - - 27 + - 49.1948 + - - - 704 + - 128 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 3 + - 151.768 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 2368 + - - 7 + - 4174.92 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 128 + - - 12 + - 150.657 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 6784 + - - 10 + - 4287.21 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 704 + - 4 + - - 28 + - 13.8421 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 4288 + - - 10 + - 4137.71 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 64 + - - 5 + - 452.291 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 2944 + - - 10 + - 3994.34 + - - - 2368 + 
- 128 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 128 + - - 7 + - 2155.41 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 64 + - - 19 + - 1099.31 + - - - 1408 + - 5056 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 5056 + - - 0 + - 2168.32 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 128 + - - 18 + - 3018.97 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 704 + - 704 + - - 7 + - 2156.81 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1856 + - - 18 + - 3856.87 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 3584 + - - 10 + - 4040.35 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1408 + - - 4 + - 4006.97 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1024 + - - 15 + - 395.689 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 2368 + - - 18 + - 4161.31 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 5056 + - - 17 + - 4266.99 + - - - 704 + - 6784 + - 1 + - 128 + - 704 + - 704 + - 704 + - 6784 + - - 1 + - 2037.74 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 448 + - 704 + - - 4 + - 2232.86 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 4 + - 704 + - - 27 + - 13.3499 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 128 + - 704 + - - 7 + - 837.44 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 704 + - - 7 + - 3796.58 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 5056 + - - 18 + - 4068.92 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 2368 + - - 28 + - 260.606 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1408 + - - 18 + - 4171.04 + - - - 448 + - 64 + - 1 + - 128 + - 448 + - 448 + - 448 + - 64 + - - 3 + - 52.6696 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1408 + - - 15 + - 1763.66 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1024 + - - 17 + - 3621.89 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 
704 + - 704 + - 4288 + - - 4 + - 3864.67 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 2944 + - - 10 + - 4263.67 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 2368 + - - 18 + - 3987.55 + - - - 1856 + - 128 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 388.262 + - - - 5056 + - 256 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 256 + - - 1 + - 1234.91 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1024 + - - 17 + - 2945.89 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 448 + - - 14 + - 433.369 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 2368 + - - 18 + - 3930.78 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3584 + - - 10 + - 4287.53 + - - - 4288 + - 6784 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 6784 + - - 0 + - 2601.23 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 2368 + - - 18 + - 4111.79 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 128 + - 448 + - - 15 + - 350.192 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 448 + - 2944 + - - 18 + - 3447.2 + - - - 2368 + - 4 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 4 + - - 25 + - 21.5581 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 448 + - - 4 + - 4069.89 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1408 + - - 4 + - 3078.35 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 704 + - 6784 + - - 18 + - 3982.71 + - - - 1024 + - 5056 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 5056 + - - 1 + - 2030.33 + - - - 1856 + - 64 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 64 + - - 3 + - 200.479 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1024 + - - 20 + - 3451.09 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 1856 + - - 18 + - 4149.44 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 64 + - - 12 + - 134.063 + - - - 5888 + - 1856 + - 1 + - 128 + - 5888 + - 5888 + - 5888 
+ - 1856 + - - 0 + - 2361.25 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 448 + - - 18 + - 3078.42 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 18 + - 2262.41 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 256 + - - 7 + - 2132.18 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1024 + - - 7 + - 754.371 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 5056 + - - 18 + - 4018.19 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 448 + - 448 + - - 15 + - 1105.43 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 6784 + - - 10 + - 4265.75 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 4288 + - - 10 + - 4189.99 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 5888 + - - 10 + - 4192.46 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 128 + - - 7 + - 2204.21 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 64 + - - 15 + - 531.047 + - - - 128 + - 4 + - 1 + - 128 + - 128 + - 128 + - 128 + - 4 + - - 25 + - 1.2282 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 5056 + - - 17 + - 4425.06 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 1856 + - - 17 + - 3892.55 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 6784 + - - 4 + - 3886.67 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 128 + - - 7 + - 3056.13 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 4 + - - 28 + - 99.8689 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1408 + - - 18 + - 3710.78 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 5056 + - - 17 + - 4186.7 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 5056 + - - 18 + - 4089.12 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 128 + - 2368 + - - 15 + - 1556.87 + - - - 2944 + - 448 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 448 
+ - - 1 + - 1261.36 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 5888 + - - 10 + - 4314.13 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 7 + - 1769.07 + - - - 256 + - 64 + - 1 + - 128 + - 256 + - 256 + - 256 + - 64 + - - 3 + - 27.2783 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 64 + - - 19 + - 1937.05 + - - - 6784 + - 128 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 3 + - 1110.6 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 4288 + - - 18 + - 4007.98 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 256 + - - 4 + - 3635.96 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 128 + - - 16 + - 273.678 + - - - 4288 + - 4288 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 4288 + - - 0 + - 2574.53 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 4 + - - 26 + - 203.68 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 4 + - - 28 + - 40.6862 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 4288 + - - 18 + - 4160.53 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 128 + - - 28 + - 14.4991 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 704 + - - 7 + - 2823.69 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 256 + - 2368 + - - 4 + - 2615.55 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1408 + - - 28 + - 178.849 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 704 + - - 7 + - 3949.11 + - - - 6784 + - 2944 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 2944 + - - 0 + - 2573.52 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 448 + - - 7 + - 2006.47 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 256 + - - 7 + - 2239.72 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1024 + - - 11 + - 3348.51 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1856 + - - 18 + - 4050.74 + - - - 6784 + - 
1024 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1024 + - - 20 + - 3787.02 + - - - 64 + - 4288 + - 1 + - 128 + - 64 + - 64 + - 64 + - 4288 + - - 3 + - 411.519 + - - - 1408 + - 2368 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 2368 + - - 1 + - 1845.25 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 2944 + - - 4 + - 3625.7 + - - - 4 + - 1408 + - 1 + - 128 + - 4 + - 4 + - 4 + - 1408 + - - 25 + - 12.3105 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 64 + - - 4 + - 1628.97 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 2944 + - - 4 + - 3049.51 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 4 + - - 28 + - 7.88776 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1856 + - - 7 + - 3124.18 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1856 + - - 27 + - 32.4546 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 6784 + - - 10 + - 4259.01 + - - - 2368 + - 5888 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 5888 + - - 0 + - 2439.42 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 256 + - - 5 + - 415.341 + - - - 2368 + - 1856 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 1856 + - - 1 + - 2018.96 + - - - 2944 + - 4 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 4 + - - 25 + - 26.9168 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 4 + - - 30 + - 32.5882 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 704 + - 2368 + - - 18 + - 3002.04 + - - - 1856 + - 448 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 448 + - - 3 + - 1056.7 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 5888 + - - 17 + - 4367.53 + - - - 3584 + - 5056 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 5056 + - - 0 + - 2540.59 + - - - 5888 + - 2944 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 2944 + - - 0 + - 2558.8 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 704 + - - 20 + - 3946.11 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 256 
+ - - 4 + - 3182.39 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 2944 + - - 10 + - 4208.2 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3584 + - - 17 + - 4228.98 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 704 + - - 9 + - 2122.08 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1856 + - - 19 + - 1870.33 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 2944 + - - 18 + - 3985.41 + - - - 1408 + - 704 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 704 + - - 1 + - 1005.05 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 5056 + - - 4 + - 2745.48 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1856 + - - 7 + - 3908.07 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 4288 + - - 17 + - 4242.43 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1024 + - - 28 + - 92.6772 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 3584 + - - 20 + - 4352.28 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1408 + - - 18 + - 3835.15 + - - - 3584 + - 4 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 4 + - - 25 + - 32.7683 + - - - 2944 + - 5056 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 5056 + - - 0 + - 2467.45 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 2944 + - - 4 + - 3754.61 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 3584 + - - 10 + - 4248.22 + - - - 1856 + - 4288 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 4288 + - - 1 + - 2232.8 + - - - 1408 + - 1856 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 1856 + - - 0 + - 1688.69 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 64 + - 448 + - - 15 + - 182.044 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1856 + - - 10 + - 4055.91 + - - - 3584 + - 1408 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 1408 + - - 1 + - 2027.13 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 448 + - - 18 + - 
3424.67 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 4 + - - 30 + - 190.48 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 6784 + - - 4 + - 3595.4 + - - - 448 + - 5056 + - 1 + - 128 + - 448 + - 448 + - 448 + - 5056 + - - 1 + - 1580.52 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 704 + - 1024 + - - 18 + - 2757.21 + - - - 1408 + - 4 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 4 + - - 25 + - 12.9846 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 256 + - 5056 + - - 18 + - 3390.35 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 5888 + - - 4 + - 3251.99 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 128 + - 5888 + - - 18 + - 2270.93 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 4 + - - 30 + - 59.1175 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 64 + - - 7 + - 1368.67 + - - - 5888 + - 1408 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 1408 + - - 1 + - 2299.27 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 2944 + - - 4 + - 3143.19 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 5888 + - - 17 + - 4258.38 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 256 + - - 4 + - 3139.1 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 128 + - 5888 + - - 4 + - 2825.14 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 256 + - - 19 + - 1845.66 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 2944 + - - 10 + - 3973.47 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 4288 + - - 7 + - 2232.13 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 6784 + - - 18 + - 4048.94 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 5888 + - - 18 + - 3939.39 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 7 + - 662.458 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 256 + - 4 + - - 28 + - 15.4809 + - - - 5888 + - 3584 + - 1 + - 256 + - 
5888 + - 5888 + - 5888 + - 3584 + - - 10 + - 4100.08 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 64 + - - 7 + - 1985.58 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 64 + - - 7 + - 1948.63 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 2368 + - - 18 + - 4086.94 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1408 + - - 19 + - 1081.73 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 3584 + - - 17 + - 3387.47 + - - - 448 + - 1408 + - 1 + - 128 + - 448 + - 448 + - 448 + - 1408 + - - 3 + - 856.752 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 4 + - - 26 + - 303.992 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 256 + - - 14 + - 1190.0 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 4 + - 1024 + - - 27 + - 18.3061 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 6784 + - - 10 + - 4419.48 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1024 + - - 7 + - 1435.7 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 2944 + - - 7 + - 3206.43 + - - - 64 + - 448 + - 1 + - 128 + - 64 + - 64 + - 64 + - 448 + - - 3 + - 45.466 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 448 + - - 7 + - 2334.16 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 64 + - 4288 + - - 7 + - 1961.69 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 5888 + - - 17 + - 4323.1 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 256 + - 2944 + - - 4 + - 2827.34 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 2368 + - - 7 + - 4048.01 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 1024 + - - 14 + - 1117.34 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 2368 + - - 18 + - 3876.41 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 448 + - - 18 + - 3311.23 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 2368 + - - 28 + - 184.339 + - - 
- 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 448 + - 4 + - - 31 + - 9.50978 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 704 + - 3584 + - - 4 + - 3359.52 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1408 + - - 9 + - 3238.2 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 256 + - - 5 + - 775.397 + - - - 448 + - 1856 + - 1 + - 128 + - 448 + - 448 + - 448 + - 1856 + - - 3 + - 1035.32 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 256 + - - 4 + - 3796.1 + - - - 704 + - 1856 + - 1 + - 128 + - 704 + - 704 + - 704 + - 1856 + - - 1 + - 1255.61 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 256 + - 128 + - - 7 + - 302.474 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 448 + - - 28 + - 46.1919 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 6784 + - - 4 + - 3748.81 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 2944 + - - 17 + - 4186.12 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 256 + - - 9 + - 2166.85 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 5056 + - - 18 + - 4053.85 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 4 + - 2944 + - - 27 + - 118.501 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 64 + - - 5 + - 402.109 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 4 + - 3584 + - - 30 + - 59.0414 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3584 + - - 17 + - 4367.01 + - - - 256 + - 1408 + - 1 + - 128 + - 256 + - 256 + - 256 + - 1408 + - - 1 + - 482.205 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 704 + - - 18 + - 3021.1 + - - - 4288 + - 704 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 704 + - - 1 + - 1747.47 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 6784 + - - 10 + - 4285.98 + - - - 448 + - 4288 + - 1 + - 128 + - 448 + - 448 + - 448 + - 4288 + - - 2 + - 1632.31 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1856 + 
- - 18 + - 3969.34 + - - - 5056 + - 2368 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 2368 + - - 0 + - 2391.83 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 704 + - - 18 + - 3625.17 + - - - 2368 + - 1024 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 1024 + - - 0 + - 1546.33 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1024 + - - 18 + - 3481.25 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1408 + - - 18 + - 3864.35 + - - - 4288 + - 5888 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 5888 + - - 0 + - 2579.1 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 448 + - - 18 + - 3467.02 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 128 + - - 15 + - 1542.02 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 18 + - 3061.96 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1408 + - - 7 + - 834.209 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 704 + - 4 + - - 28 + - 36.0929 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 256 + - - 7 + - 1871.06 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3584 + - - 7 + - 2616.41 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 704 + - 3584 + - - 10 + - 3110.18 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3584 + - - 4 + - 3970.89 + - - - 6784 + - 3584 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 3584 + - - 0 + - 2645.33 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 4288 + - - 4 + - 3530.93 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 128 + - 5056 + - - 4 + - 2044.36 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 2368 + - - 4 + - 3056.02 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 64 + - - 7 + - 2652.19 + - - - 4288 + - 64 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 64 + - - 3 + - 414.237 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 6784 + - - 10 + - 4405.4 + - - - 
704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 704 + - 2944 + - - 4 + - 3469.96 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1024 + - - 20 + - 4101.81 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 5888 + - - 18 + - 4137.88 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 4 + - - 27 + - 50.786 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1408 + - - 7 + - 2553.73 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 4 + - 4288 + - - 27 + - 67.1804 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 5888 + - - 18 + - 3948.79 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 448 + - 2368 + - - 18 + - 2507.21 + - - - 3584 + - 5888 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 5888 + - - 0 + - 2592.46 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 4 + - 4 + - - 28 + - 0.265744 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 64 + - - 7 + - 604.367 + - - - 4288 + - 1408 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 1408 + - - 1 + - 2130.57 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1856 + - - 7 + - 1093.31 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 448 + - 1408 + - - 7 + - 2743.78 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 448 + - - 4 + - 3883.56 + - - - 448 + - 256 + - 1 + - 128 + - 448 + - 448 + - 448 + - 256 + - - 3 + - 194.181 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 128 + - - 7 + - 1629.14 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 5056 + - - 18 + - 3988.79 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 256 + - - 28 + - 28.0411 + - - - 6784 + - 5056 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 5056 + - - 0 + - 2709.18 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3584 + - - 4 + - 3666.3 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1024 + - - 20 + - 3268.29 + - - - 5056 + - 64 + - 1 + - 128 + - 5056 + - 5056 + - 5056 
+ - 64 + - - 3 + - 480.719 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 704 + - - 7 + - 3478.45 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 6784 + - - 10 + - 3993.99 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 704 + - 4288 + - - 18 + - 3350.68 + - - - 64 + - 5056 + - 1 + - 128 + - 64 + - 64 + - 64 + - 5056 + - - 3 + - 468.962 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 1024 + - - 18 + - 2733.19 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 5056 + - - 10 + - 4249.37 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 704 + - - 7 + - 4025.83 + - - - 2944 + - 64 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 64 + - - 3 + - 317.332 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 704 + - - 9 + - 3259.19 + - - - 4 + - 64 + - 1 + - 128 + - 4 + - 4 + - 4 + - 64 + - - 25 + - 0.548331 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 2944 + - - 10 + - 4243.62 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 1408 + - - 18 + - 3974.97 + - - - 256 + - 5888 + - 1 + - 128 + - 256 + - 256 + - 256 + - 5888 + - - 1 + - 1294.54 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1024 + - - 22 + - 3589.81 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 4 + - - 27 + - 158.022 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1856 + - - 18 + - 3321.05 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 128 + - - 11 + - 2726.97 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 64 + - 64 + - - 7 + - 22.2533 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 256 + - - 4 + - 3759.56 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 6784 + - - 10 + - 4303.45 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 448 + - 1024 + - - 7 + - 2194.33 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 4288 + - - 17 + - 
4360.59 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 128 + - 3584 + - - 7 + - 2168.4 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 4 + - 3584 + - - 27 + - 139.297 + - - - 6784 + - 2368 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 2368 + - - 0 + - 2519.43 + - - - 128 + - 256 + - 1 + - 128 + - 128 + - 128 + - 128 + - 256 + - - 3 + - 56.0137 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 2944 + - - 18 + - 3243.75 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 448 + - - 7 + - 3055.04 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 2368 + - - 10 + - 4208.91 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 3584 + - - 4 + - 3420.14 + - - - 128 + - 2944 + - 1 + - 128 + - 128 + - 128 + - 128 + - 2944 + - - 3 + - 523.833 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 704 + - - 14 + - 1522.61 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 1856 + - - 18 + - 3832.47 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3584 + - - 17 + - 4119.44 + - - - 2944 + - 128 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 3 + - 581.419 + - - - 1856 + - 6784 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 6784 + - - 1 + - 2409.21 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 4288 + - - 20 + - 4380.09 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 3584 + - - 10 + - 4080.5 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 448 + - - 7 + - 3829.87 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3584 + - - 20 + - 4390.34 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 5888 + - - 10 + - 4275.07 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 256 + - - 7 + - 2619.08 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 448 + - - 7 + - 3663.47 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 704 + - - 18 + - 
2339.19 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 448 + - - 4 + - 3377.32 + - - - 6784 + - 1024 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 1024 + - - 0 + - 2125.22 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 2368 + - - 18 + - 4016.29 + - - - 1024 + - 1408 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 1408 + - - 1 + - 1375.59 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 4 + - - 29 + - 99.9254 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 817.831 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 4288 + - - 10 + - 4202.31 + - - - 3584 + - 1856 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 1856 + - - 0 + - 2196.26 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 2944 + - - 18 + - 3930.31 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 5888 + - - 17 + - 4306.91 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 128 + - 5056 + - - 4 + - 2797.3 + - - - 5888 + - 1024 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 1024 + - - 0 + - 2050.35 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 6784 + - - 7 + - 3450.0 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 704 + - - 7 + - 3637.63 + - - - 256 + - 2944 + - 1 + - 128 + - 256 + - 256 + - 256 + - 2944 + - - 1 + - 901.917 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3584 + - - 10 + - 4071.21 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 448 + - 128 + - - 15 + - 354.249 + - - - 1856 + - 4 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 4 + - - 25 + - 16.8251 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 6784 + - - 10 + - 4393.61 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 2368 + - - 18 + - 4075.35 + - - - 448 + - 704 + - 1 + - 128 + - 448 + - 448 + - 448 + - 704 + - - 3 + - 501.617 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 4288 + - - 17 + - 4322.53 + 
- - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 2368 + - - 18 + - 3765.74 + - - - 2944 + - 4288 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 4288 + - - 0 + - 2496.38 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 2944 + - - 7 + - 2034.97 + - - - 1856 + - 1024 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 1024 + - - 2 + - 1544.37 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 704 + - - 7 + - 3674.62 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 2944 + - - 20 + - 4252.0 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 704 + - - 4 + - 3858.27 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1856 + - - 17 + - 4287.04 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 5056 + - - 18 + - 3869.6 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1856 + - - 20 + - 3695.33 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 448 + - - 7 + - 3465.82 + - - - 4288 + - 448 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 448 + - - 2 + - 1651.61 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 256 + - - 7 + - 3075.82 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 704 + - - 4 + - 3504.25 + - - - 704 + - 4288 + - 1 + - 128 + - 704 + - 704 + - 704 + - 4288 + - - 1 + - 1728.71 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1856 + - - 18 + - 4128.67 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 704 + - 2944 + - - 18 + - 3021.52 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 765.042 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 5056 + - - 10 + - 4278.86 + - - - 64 + - 2368 + - 1 + - 128 + - 64 + - 64 + - 64 + - 2368 + - - 3 + - 250.241 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 448 + - - 18 + - 2868.8 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 2368 + - - 4 + - 3289.5 + - - - 
128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 64 + - - 12 + - 248.026 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 5056 + - - 17 + - 4065.98 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3584 + - - 21 + - 3791.52 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1408 + - - 18 + - 3892.98 + - - - 448 + - 3584 + - 1 + - 128 + - 448 + - 448 + - 448 + - 3584 + - - 2 + - 1458.84 + - - - 128 + - 1408 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1408 + - - 3 + - 306.438 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 1024 + - - 17 + - 3394.41 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 704 + - - 4 + - 1946.49 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 2378.82 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 6784 + - - 10 + - 4373.11 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 3584 + - - 17 + - 4095.54 + - - - 5888 + - 5056 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 5056 + - - 0 + - 2660.24 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 64 + - - 4 + - 2292.55 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 128 + - - 28 + - 20.4211 + - - - 4288 + - 128 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 3 + - 757.707 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 704 + - 2368 + - - 18 + - 3294.34 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 5888 + - - 10 + - 4325.87 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 256 + - - 4 + - 3396.85 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 2646.84 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 5056 + - - 7 + - 3248.34 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 64 + - - 7 + - 3192.06 + - - - 5056 + - 5056 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 5056 + - - 0 + - 2591.14 + - - - 4288 + - 448 + - 
1 + - 3328 + - 4288 + - 4288 + - 4288 + - 448 + - - 4 + - 4200.73 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 704 + - 256 + - - 7 + - 1616.96 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 64 + - - 4 + - 3663.64 + - - - 2368 + - 2368 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 2368 + - - 1 + - 2102.13 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1024 + - - 7 + - 1198.37 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 448 + - - 7 + - 2693.0 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 4288 + - - 18 + - 3843.54 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 2944 + - - 10 + - 4104.08 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 448 + - - 6 + - 1832.89 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 704 + - - 9 + - 2854.84 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 704 + - 5888 + - - 18 + - 3598.61 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 4 + - 256 + - - 28 + - 15.1237 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 64 + - - 14 + - 1539.49 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1408 + - - 4 + - 3051.08 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 128 + - 448 + - - 4 + - 532.401 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 704 + - - 4 + - 3602.24 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 256 + - - 4 + - 3264.52 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 3584 + - - 17 + - 4359.56 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 448 + - - 7 + - 2737.58 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1856 + - - 18 + - 3676.41 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 704 + - 64 + - - 7 + - 415.902 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 64 + - - 7 + - 3473.41 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 256 + - 704 + 
- - 4 + - 1601.99 + - - - 6784 + - 6784 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 6784 + - - 0 + - 2747.11 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 128 + - 128 + - - 15 + - 107.657 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 2368 + - - 18 + - 3661.38 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 2368 + - - 18 + - 3993.21 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 64 + - 704 + - - 7 + - 417.911 + - - - 1856 + - 704 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 704 + - - 1 + - 1258.64 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 4288 + - - 10 + - 4225.49 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 448 + - 4 + - - 31 + - 24.9322 + - - - 64 + - 1024 + - 1 + - 128 + - 64 + - 64 + - 64 + - 1024 + - - 3 + - 110.145 + - - - 2944 + - 1856 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 1856 + - - 0 + - 2084.03 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 64 + - - 7 + - 1046.76 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 3584 + - - 10 + - 4278.32 + - - - 3584 + - 6784 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 6784 + - - 0 + - 2641.2 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 256 + - 6784 + - - 18 + - 3413.67 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 15 + - 996.057 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 704 + - - 18 + - 3029.81 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 2368 + - - 4 + - 2464.44 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 5888 + - - 20 + - 4117.44 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 128 + - 3584 + - - 4 + - 3161.54 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1024 + - - 19 + - 804.387 + - - - 4288 + - 5056 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 5056 + - - 0 + - 2562.86 + - - - 1856 + - 1856 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 1856 + - - 1 + - 1826.84 + - - - 
5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1024 + - - 17 + - 3404.05 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 64 + - - 5 + - 1010.42 + - - - 1856 + - 5888 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 5888 + - - 1 + - 2349.51 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 4 + - 5056 + - - 27 + - 176.822 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1408 + - - 23 + - 3492.59 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 3584 + - - 18 + - 2711.0 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 64 + - - 7 + - 2631.56 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1024 + - - 18 + - 3653.64 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 64 + - - 12 + - 156.437 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 128 + - 2944 + - - 4 + - 1841.01 + - - - 1856 + - 2944 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 2944 + - - 0 + - 2090.01 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 4 + - 2368 + - - 27 + - 40.0931 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 128 + - - 12 + - 243.942 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 256 + - - 18 + - 3403.22 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 4288 + - - 17 + - 4292.66 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 256 + - - 7 + - 2924.32 + - - - 448 + - 5888 + - 1 + - 128 + - 448 + - 448 + - 448 + - 5888 + - - 1 + - 1660.31 + - - - 1408 + - 6784 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 6784 + - - 0 + - 2379.79 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 6784 + - - 10 + - 4355.93 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 4288 + - - 18 + - 4020.58 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 4 + - - 30 + - 303.241 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 3584 + - - 17 + - 4253.07 + - - - 2944 + - 1024 + - 1 + - 
128 + - 2944 + - 2944 + - 2944 + - 1024 + - - 1 + - 1581.98 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 6784 + - - 26 + - 343.851 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 448 + - - 7 + - 3013.1 + - - - 4 + - 1856 + - 1 + - 128 + - 4 + - 4 + - 4 + - 1856 + - - 25 + - 16.9209 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 448 + - 64 + - - 15 + - 181.325 + - - - 128 + - 64 + - 1 + - 128 + - 128 + - 128 + - 128 + - 64 + - - 3 + - 14.1394 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 128 + - - 15 + - 1290.69 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 704 + - 6784 + - - 18 + - 3783.86 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 64 + - - 7 + - 870.676 + - - - 5888 + - 704 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 704 + - - 1 + - 1953.54 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 3584 + - - 20 + - 4095.68 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 704 + - 1856 + - - 18 + - 3428.15 + - - - 256 + - 5056 + - 1 + - 128 + - 256 + - 256 + - 256 + - 5056 + - - 1 + - 1252.08 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2944 + - - 18 + - 2286.0 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 256 + - - 5 + - 490.644 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1856 + - - 20 + - 4151.88 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 448 + - - 18 + - 2496.15 + - - - 2944 + - 2944 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 2944 + - - 0 + - 2350.01 + - - - 64 + - 256 + - 1 + - 128 + - 64 + - 64 + - 64 + - 256 + - - 3 + - 26.2669 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 256 + - - 4 + - 3965.53 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 5056 + - - 10 + - 4320.66 + - - - 1408 + - 3584 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 3584 + - - 1 + - 2021.04 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 64 + - - 28 + - 7.7913 + 
- - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 3584 + - - 10 + - 4019.58 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 256 + - - 14 + - 264.41 + - - - 704 + - 1408 + - 1 + - 128 + - 704 + - 704 + - 704 + - 1408 + - - 1 + - 1042.03 + - - - 2368 + - 704 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 704 + - - 2 + - 1443.35 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 6784 + - - 18 + - 3944.76 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1024 + - - 4 + - 3656.96 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 64 + - 4 + - - 28 + - 4.39642 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 704 + - 128 + - - 4 + - 831.004 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 2944 + - - 18 + - 3875.96 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1856 + - - 4 + - 3831.19 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1024 + - - 20 + - 3930.41 + - - - 1024 + - 2368 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 2368 + - - 1 + - 1655.18 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 64 + - - 7 + - 1858.03 + - - - 704 + - 5056 + - 1 + - 128 + - 704 + - 704 + - 704 + - 5056 + - - 1 + - 1836.53 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 448 + - - 18 + - 3133.99 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 6784 + - - 4 + - 4087.96 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 4288 + - - 4 + - 4202.05 + - - - 448 + - 2944 + - 1 + - 128 + - 448 + - 448 + - 448 + - 2944 + - - 1 + - 1259.1 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 64 + - 448 + - - 4 + - 266.2 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 256 + - 64 + - - 4 + - 150.802 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 2368 + - - 18 + - 4150.08 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 448 + - - 7 + - 3869.44 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 
2944 + - 2944 + - 6784 + - - 10 + - 4228.86 + - - - 1024 + - 4288 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 4288 + - - 1 + - 2006.13 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1024 + - - 18 + - 3398.52 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1408 + - - 10 + - 4189.86 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 64 + - - 19 + - 1489.79 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 256 + - 5888 + - - 4 + - 3157.4 + - - - 2368 + - 128 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 3 + - 485.452 + - - - 1024 + - 1856 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 1856 + - - 1 + - 1565.04 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1408 + - - 7 + - 3090.7 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 256 + - - 4 + - 3104.03 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 128 + - - 18 + - 2621.44 + - - - 4 + - 4 + - 1 + - 128 + - 4 + - 4 + - 4 + - 4 + - - 25 + - 0.0345949 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 64 + - 6784 + - - 7 + - 3046.85 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 128 + - 4 + - - 30 + - 3.30323 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 2368 + - - 7 + - 1646.35 + - - - 704 + - 64 + - 1 + - 128 + - 704 + - 704 + - 704 + - 64 + - - 3 + - 79.7451 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1856 + - - 7 + - 2752.11 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1856 + - - 17 + - 4081.4 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 4288 + - - 18 + - 3797.55 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 5056 + - - 20 + - 3949.43 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 256 + - - 19 + - 1383.42 + - - - 2368 + - 448 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 448 + - - 1 + - 1038.79 + - - - 2368 + - 64 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 64 + - - 3 + - 257.961 + - 
- - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 3584 + - - 4 + - 3602.42 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 448 + - - 4 + - 3615.0 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 2944 + - - 7 + - 2198.01 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 704 + - 64 + - - 15 + - 280.504 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 4 + - 64 + - - 31 + - 1.66504 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 2368 + - - 7 + - 2924.63 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 5056 + - - 18 + - 3738.15 + - - - 4288 + - 2944 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 2944 + - - 1 + - 2408.85 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 2944 + - - 4 + - 3834.69 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 1024 + - - 11 + - 3654.42 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 256 + - - 4 + - 3688.11 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 5056 + - - 4 + - 3978.54 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 6784 + - - 10 + - 4112.92 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 448 + - 448 + - - 7 + - 1769.29 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 2944 + - - 20 + - 4115.75 + - - - 3584 + - 3584 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 3584 + - - 0 + - 2393.12 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 2944 + - - 28 + - 205.439 + - - - 5056 + - 2944 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 2944 + - - 0 + - 2466.94 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 128 + - - 9 + - 2755.49 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 448 + - - 7 + - 2559.7 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 2944 + - - 10 + - 4289.38 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 4 + - 5888 + - - 26 + - 89.4026 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 
+ - 128 + - 2944 + - - 7 + - 2652.19 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 5888 + - - 20 + - 4387.06 + - - - 6784 + - 4 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 4 + - - 25 + - 60.8948 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 64 + - - 7 + - 2232.13 + - - - 5888 + - 3584 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 3584 + - - 0 + - 2599.05 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 4288 + - - 27 + - 262.078 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1856 + - - 4 + - 4030.52 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1024 + - - 18 + - 2883.83 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 3584 + - - 10 + - 4219.95 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 128 + - - 18 + - 2826.24 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 128 + - - 15 + - 212.262 + - - - 5888 + - 6784 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 6784 + - - 0 + - 2725.29 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 128 + - - 15 + - 1008.25 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 5888 + - - 18 + - 4094.36 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 6784 + - - 4 + - 3695.82 + - - - 128 + - 4288 + - 1 + - 128 + - 128 + - 128 + - 128 + - 4288 + - - 3 + - 679.708 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 2368 + - - 10 + - 4095.54 + - - - 3584 + - 4288 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 4288 + - - 0 + - 2510.89 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 4288 + - - 27 + - 336.41 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 64 + - - 19 + - 807.929 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1408 + - - 18 + - 3957.28 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1408 + - - 18 + - 2323.77 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 5888 
+ - - 18 + - 3895.64 + - - - 64 + - 128 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 3 + - 13.2396 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 3584 + - - 17 + - 4007.14 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 1408 + - - 18 + - 3843.87 + - - - 4 + - 6784 + - 1 + - 128 + - 4 + - 4 + - 4 + - 6784 + - - 24 + - 60.7244 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 5056 + - - 18 + - 4011.8 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3584 + - - 27 + - 299.839 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 64 + - 4 + - - 30 + - 1.77701 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1024 + - - 17 + - 3679.32 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 5888 + - - 18 + - 4172.63 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 256 + - - 28 + - 40.1495 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 5056 + - - 18 + - 4015.24 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 256 + - 448 + - - 7 + - 1056.63 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 3584 + - - 17 + - 4099.34 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 256 + - - 7 + - 3818.82 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 64 + - - 7 + - 1687.31 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 4288 + - - 17 + - 4338.94 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1856 + - - 28 + - 157.033 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1856 + - - 18 + - 3018.91 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 256 + - - 23 + - 3172.11 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 6784 + - - 17 + - 4204.59 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1024 + - - 18 + - 2847.39 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 5888 + - - 18 + - 4149.61 + - - - 5056 + - 
4288 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 4288 + - - 0 + - 2562.86 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 6784 + - - 4 + - 3986.64 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 4288 + - - 4 + - 2662.89 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 128 + - - 7 + - 1192.69 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 4 + - - 27 + - 78.0661 + - - - 256 + - 3584 + - 1 + - 128 + - 256 + - 256 + - 256 + - 3584 + - - 1 + - 1038.93 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 64 + - - 5 + - 698.744 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 704 + - - 28 + - 98.525 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1024 + - - 17 + - 3545.23 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 3584 + - - 17 + - 4326.23 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 704 + - 5056 + - - 18 + - 3478.97 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 6784 + - - 17 + - 4218.14 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 1408 + - - 18 + - 3632.12 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 128 + - 1408 + - - 15 + - 996.057 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1024 + - - 17 + - 3544.86 + - - - 6784 + - 256 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 256 + - - 2 + - 1537.76 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 64 + - - 7 + - 3020.35 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 704 + - - 7 + - 2409.24 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 31 + - 5.70871 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 4 + - - 26 + - 341.665 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 4 + - - 31 + - 203.067 + - - - 128 + - 3584 + - 1 + - 128 + - 128 + - 128 + - 128 + - 3584 + - - 3 + - 609.637 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + 
- 128 + - - 4 + - 3751.53 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 128 + - - 7 + - 3666.09 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 4 + - - 30 + - 314.513 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 4288 + - - 17 + - 4302.74 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 64 + - 3584 + - - 4 + - 1980.22 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 256 + - - 23 + - 3486.71 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 128 + - - 7 + - 3194.01 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 2368 + - - 18 + - 3916.28 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 2944 + - - 18 + - 3613.32 + - - - 256 + - 448 + - 1 + - 128 + - 256 + - 256 + - 256 + - 448 + - - 3 + - 195.63 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 2368 + - - 10 + - 4219.07 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1024 + - - 13 + - 3334.33 + - - - 5056 + - 3584 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 3584 + - - 0 + - 2541.48 + - - - 128 + - 448 + - 1 + - 128 + - 128 + - 128 + - 128 + - 448 + - - 3 + - 98.4446 + - - - 5056 + - 4 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 4 + - - 25 + - 45.5115 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1856 + - - 7 + - 684.881 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 64 + - - 15 + - 1638.4 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 256 + - - 7 + - 2572.71 + - - - 704 + - 448 + - 1 + - 128 + - 704 + - 704 + - 704 + - 448 + - - 3 + - 507.163 + - - - 1024 + - 6784 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 6784 + - - 1 + - 2163.7 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 2944 + - - 18 + - 4017.85 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1408 + - - 18 + - 2895.43 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 5056 + - - 17 + - 
4221.24 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 704 + - - 5 + - 961.688 + - - - 128 + - 704 + - 1 + - 128 + - 128 + - 128 + - 128 + - 704 + - - 3 + - 153.545 + - - - 128 + - 5056 + - 1 + - 128 + - 128 + - 128 + - 128 + - 5056 + - - 3 + - 786.233 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 15 + - 397.942 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 64 + - - 12 + - 87.6317 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 448 + - - 28 + - 66.5006 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 5888 + - - 10 + - 4293.47 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 5056 + - - 18 + - 4110.19 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 128 + - 704 + - - 7 + - 530.071 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 5056 + - - 17 + - 4385.19 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 448 + - 64 + - - 7 + - 265.43 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 128 + - - 11 + - 3079.28 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 4288 + - - 18 + - 4112.83 + - - - 4288 + - 1856 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 1856 + - - 1 + - 2206.49 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 2944 + - - 10 + - 4255.37 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1408 + - - 4 + - 3177.6 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 704 + - - 7 + - 3550.0 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1024 + - - 17 + - 3641.44 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 3584 + - - 17 + - 4170.99 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 448 + - - 5 + - 1195.15 + - - - 64 + - 64 + - 1 + - 128 + - 64 + - 64 + - 64 + - 64 + - - 3 + - 6.32587 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 2944 + - - 10 + - 4257.95 + - - - 1408 + - 2944 + - 1 + - 128 + - 
1408 + - 1408 + - 1408 + - 2944 + - - 1 + - 1924.62 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 2944 + - - 18 + - 3974.12 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 448 + - - 4 + - 2165.2 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 704 + - - 7 + - 2558.78 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 256 + - - 4 + - 3802.07 + - - - 256 + - 1024 + - 1 + - 128 + - 256 + - 256 + - 256 + - 1024 + - - 1 + - 361.266 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 448 + - - 6 + - 1342.92 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 64 + - 2368 + - - 7 + - 861.397 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 64 + - 1408 + - - 7 + - 533.997 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 4 + - - 27 + - 253.563 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 5056 + - - 10 + - 4232.24 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1024 + - - 4 + - 2131.41 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 4288 + - - 10 + - 4277.59 + - - - 2944 + - 1408 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 1408 + - - 1 + - 1943.8 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 4 + - 704 + - - 28 + - 35.338 + - - - 64 + - 1408 + - 1 + - 128 + - 64 + - 64 + - 64 + - 1408 + - - 3 + - 151.131 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 6784 + - - 4 + - 3809.69 + - - - 6784 + - 1408 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 1408 + - - 0 + - 2365.06 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 704 + - - 7 + - 3542.33 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 5888 + - - 17 + - 4406.81 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 5888 + - - 27 + - 299.244 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 5888 + - - 10 + - 4351.82 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 4288 + - - 17 + 
- 4330.78 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 4288 + - - 10 + - 4026.38 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 704 + - 1024 + - - 18 + - 2237.5 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 5056 + - - 10 + - 4263.29 + - - - 448 + - 448 + - 1 + - 128 + - 448 + - 448 + - 448 + - 448 + - - 3 + - 340.176 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 2944 + - - 18 + - 3891.51 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 5056 + - - 18 + - 4129.48 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1408 + - - 4 + - 3598.35 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 2368 + - - 18 + - 3792.02 + - - - 6784 + - 64 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 64 + - - 3 + - 654.126 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 5056 + - - 20 + - 4019.33 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 448 + - - 4 + - 4052.05 + - - - 704 + - 3584 + - 1 + - 128 + - 704 + - 704 + - 704 + - 3584 + - - 0 + - 1618.69 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 448 + - - 4 + - 3986.63 + - - - 128 + - 5888 + - 1 + - 128 + - 128 + - 128 + - 128 + - 5888 + - - 1 + - 891.91 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1856 + - - 17 + - 4117.54 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 704 + - - 4 + - 4106.76 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 4 + - - 27 + - 245.186 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 2368 + - - 9 + - 2680.52 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 2368 + - - 10 + - 4021.64 + - - - 4288 + - 3584 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 3584 + - - 0 + - 2519.38 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 704 + - 5056 + - - 20 + - 3749.64 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 1856 + - - 7 + 
- 3682.38 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 6784 + - - 18 + - 3883.84 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 6784 + - - 26 + - 293.93 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 448 + - 5888 + - - 18 + - 3609.34 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 2944 + - - 10 + - 4137.99 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 5056 + - - 18 + - 3991.76 + - - - 2368 + - 3584 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 3584 + - - 0 + - 2301.54 + - - - 256 + - 1856 + - 1 + - 128 + - 256 + - 256 + - 256 + - 1856 + - - 1 + - 618.566 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1024 + - - 11 + - 3788.93 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 256 + - - 4 + - 3555.3 + - - - 704 + - 1024 + - 1 + - 128 + - 704 + - 704 + - 704 + - 1024 + - - 3 + - 893.442 + - - - 1024 + - 3584 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 3584 + - - 1 + - 1864.73 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 1408 + - - 10 + - 3973.22 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 4288 + - - 4 + - 3408.06 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 5888 + - - 18 + - 4186.47 + - - - 4 + - 2368 + - 1 + - 128 + - 4 + - 4 + - 4 + - 2368 + - - 25 + - 21.6196 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1856 + - - 20 + - 3843.69 + - - - 1408 + - 1024 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 1024 + - - 1 + - 1363.4 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 128 + - 128 + - - 7 + - 151.968 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 704 + - - 7 + - 3695.08 + - - - 2944 + - 5888 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 5888 + - - 0 + - 2565.43 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 4 + - - 31 + - 25.3124 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1856 + - - 28 + - 225.76 + - - - 2944 + - 
64 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 64 + - - 4 + - 2012.65 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 4 + - - 27 + - 40.9047 + - - - 4 + - 128 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 25 + - 1.14255 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 2368 + - - 18 + - 3836.34 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 704 + - - 18 + - 3800.79 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 448 + - 1856 + - - 18 + - 2529.24 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 256 + - 4288 + - - 4 + - 3105.86 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1408 + - - 18 + - 3891.51 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3584 + - - 4 + - 3521.42 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 2368 + - - 18 + - 3970.99 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 4288 + - - 4 + - 4071.82 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 1856 + - - 18 + - 3848.19 + - - - 704 + - 2368 + - 1 + - 128 + - 704 + - 704 + - 704 + - 2368 + - - 2 + - 1506.11 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 1408 + - - 4 + - 3640.04 + - - - 2944 + - 704 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 704 + - - 1 + - 1502.55 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 6784 + - - 10 + - 4270.68 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 64 + - 1024 + - - 7 + - 604.367 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 2368 + - - 4 + - 3552.7 + - - - 5888 + - 2368 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 2368 + - - 0 + - 2425.89 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 704 + - - 31 + - 67.4635 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 704 + - - 4 + - 3388.18 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 704 + - - 7 + - 3647.13 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 
+ - 448 + - 5888 + - - 4 + - 3869.31 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 3584 + - - 20 + - 4239.5 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 128 + - 6784 + - - 7 + - 3237.35 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 4 + - - 28 + - 154.984 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 4288 + - - 18 + - 3993.7 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 704 + - 128 + - - 7 + - 535.982 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 2368 + - - 9 + - 1832.19 + - - - 5056 + - 5888 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 5888 + - - 0 + - 2645.76 + - - - 4 + - 1024 + - 1 + - 128 + - 4 + - 4 + - 4 + - 1024 + - - 24 + - 9.1023 + - - - 5056 + - 1024 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 1024 + - - 0 + - 1991.29 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 4 + - - 27 + - 70.0976 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 4 + - 128 + - - 27 + - 3.33686 + - - - 2944 + - 256 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 256 + - - 3 + - 942.08 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 4 + - 128 + - - 31 + - 7.94055 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 5888 + - - 18 + - 4111.91 + - - - 64 + - 3584 + - 1 + - 128 + - 64 + - 64 + - 64 + - 3584 + - - 3 + - 366.635 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1408 + - - 10 + - 4186.8 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 4288 + - - 17 + - 4328.17 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 4 + - - 27 + - 283.047 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 5056 + - - 10 + - 4255.14 + - - - 64 + - 6784 + - 1 + - 128 + - 64 + - 64 + - 64 + - 6784 + - - 3 + - 593.238 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 6784 + - - 18 + - 3577.38 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3584 + - - 17 + - 4261.24 + - - - 2368 + - 
1408 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 1408 + - - 18 + - 3916.76 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 2368 + - - 18 + - 4146.85 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 5888 + - - 18 + - 4023.53 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1024 + - - 18 + - 3312.88 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 128 + - - 18 + - 3464.75 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 4 + - - 31 + - 18.4869 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 7 + - 2245.84 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 5888 + - - 18 + - 4052.77 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 5888 + - - 17 + - 4290.43 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 4 + - - 31 + - 65.9356 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 704 + - 5888 + - - 18 + - 3830.35 + - - - 1408 + - 256 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 256 + - - 3 + - 570.442 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 4 + - 1856 + - - 28 + - 82.6803 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 64 + - - 7 + - 2121.17 + - - - 5888 + - 256 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 256 + - - 1 + - 1272.01 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 7 + - 106.131 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 2944 + - - 10 + - 4169.27 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 704 + - - 18 + - 3340.25 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 704 + - - 4 + - 3509.94 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 5056 + - - 17 + - 4418.77 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 1024 + - - 17 + - 3243.02 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 64 + - 128 + - - 14 + - 78.408 + - - - 5056 + - 5888 + - 1 + - 768 + 
- 5056 + - 5056 + - 5056 + - 5888 + - - 17 + - 4295.2 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 448 + - - 4 + - 3950.48 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 2368 + - - 7 + - 4080.47 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 5056 + - - 4 + - 3768.51 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 5056 + - - 20 + - 4242.36 + - - - 448 + - 1024 + - 1 + - 128 + - 448 + - 448 + - 448 + - 1024 + - - 3 + - 675.878 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1856 + - - 19 + - 1369.41 + - - - 4 + - 256 + - 1 + - 128 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 2.30114 + - - - 256 + - 256 + - 1 + - 128 + - 256 + - 256 + - 256 + - 256 + - - 3 + - 110.609 + - - - 256 + - 4 + - 1 + - 128 + - 256 + - 256 + - 256 + - 4 + - - 25 + - 2.47495 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 64 + - - 4 + - 2620.49 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 4 + - 5056 + - - 30 + - 77.4124 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 15 + - 205.201 + - - - 1024 + - 448 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 448 + - - 1 + - 598.698 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 2944 + - - 18 + - 3797.83 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 5056 + - - 4 + - 3639.16 + - - - 256 + - 128 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 3 + - 54.4432 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 6784 + - - 10 + - 4240.62 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 2944 + - - 10 + - 4111.07 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 128 + - - 9 + - 3085.51 + - - - 6784 + - 704 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 704 + - - 0 + - 2080.45 + - - - 4 + - 5056 + - 1 + - 128 + - 4 + - 4 + - 4 + - 5056 + - - 25 + - 45.7044 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 4 + - 2368 + - - 28 + - 99.8147 + - - - 128 
+ - 1024 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1024 + - - 9 + - 1598.53 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 4 + - - 30 + - 173.349 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 5056 + - - 18 + - 3940.89 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 5056 + - - 10 + - 4331.25 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 2368 + - - 18 + - 4108.37 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 5888 + - - 17 + - 4331.86 + - - - 1856 + - 256 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 256 + - - 3 + - 700.016 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 1024 + - - 17 + - 3335.93 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 64 + - - 4 + - 2181.49 + - - - 3584 + - 128 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 3 + - 619.935 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 5888 + - - 18 + - 4130.53 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 6784 + - - 4 + - 3678.56 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 448 + - - 4 + - 3782.24 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 4 + - - 26 + - 291.814 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 6784 + - - 10 + - 4101.34 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1024 + - - 4 + - 3865.52 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 1856 + - - 18 + - 3882.67 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 64 + - - 15 + - 103.819 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 4 + - - 28 + - 136.643 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 5888 + - - 4 + - 3770.73 + - - - 5888 + - 5888 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 5888 + - - 0 + - 2683.46 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 256 + - - 4 + - 4030.52 + - - - 3584 + - 448 + 
- 1 + - 128 + - 3584 + - 3584 + - 3584 + - 448 + - - 1 + - 1310.05 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 4 + - 64 + - - 28 + - 4.2965 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 128 + - 4288 + - - 7 + - 1735.54 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 128 + - - 7 + - 2673.75 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 6784 + - - 10 + - 4399.08 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 5888 + - - 4 + - 3959.55 + - - - 1408 + - 1408 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 1408 + - - 1 + - 1424.95 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 64 + - - 8 + - 2768.63 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 5888 + - - 18 + - 3704.65 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 64 + - 2944 + - - 15 + - 1032.42 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1024 + - - 4 + - 1857.26 + - - - 128 + - 128 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 26.8041 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 4288 + - - 17 + - 4073.06 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 6784 + - - 10 + - 4426.76 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 1408 + - - 18 + - 4125.6 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 4288 + - - 18 + - 4117.75 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1024 + - - 17 + - 3585.52 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1856 + - - 17 + - 4271.66 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 5056 + - - 20 + - 4195.67 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1408 + - - 18 + - 3657.61 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 128 + - 4 + - - 31 + - 7.9534 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 5888 + - - 10 + - 4203.36 + - - - 2944 + - 1408 + - 1 + - 3328 + - 
2944 + - 2944 + - 2944 + - 1408 + - - 18 + - 3912.3 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 4288 + - - 18 + - 3756.56 + - - - 1024 + - 2944 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 2944 + - - 1 + - 1734.43 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 2368 + - - 18 + - 3984.42 + - - - 2368 + - 2944 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 2944 + - - 1 + - 2173.05 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1408 + - - 18 + - 4054.06 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 5888 + - - 17 + - 4259.72 + - - - 128 + - 1024 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1024 + - - 3 + - 220.058 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 4 + - - 28 + - 14.9139 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 5888 + - - 4 + - 3444.97 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1856 + - - 7 + - 2088.51 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 448 + - - 4 + - 3408.93 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 2944 + - - 10 + - 4283.69 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 704 + - - 15 + - 996.057 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 4288 + - - 18 + - 3974.62 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 4 + - - 27 + - 139.438 + - - - 6784 + - 5888 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 5888 + - - 0 + - 2722.04 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 2944 + - - 28 + - 282.028 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 2368 + - - 18 + - 4126.13 + - - - 448 + - 6784 + - 1 + - 128 + - 448 + - 448 + - 448 + - 6784 + - - 1 + - 1737.95 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 704 + - - 7 + - 3707.38 + - - - 1024 + - 64 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 64 + - - 1 + - 92.3855 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 
5888 + - 5888 + - 5056 + - - 18 + - 4128.06 + - - - 704 + - 704 + - 1 + - 128 + - 704 + - 704 + - 704 + - 704 + - - 3 + - 700.517 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 2944 + - - 7 + - 3898.96 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 4 + - - 26 + - 258.358 + - - - 6784 + - 4288 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 4288 + - - 0 + - 2673.08 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 704 + - - 18 + - 3830.72 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 4 + - 4 + - - 27 + - 0.0992248 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 6784 + - - 10 + - 4409.46 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 128 + - - 14 + - 497.629 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1856 + - - 17 + - 4223.43 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 256 + - - 4 + - 2927.15 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 2944 + - - 17 + - 4199.12 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 4288 + - - 18 + - 4149.93 + - - - 128 + - 1856 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1856 + - - 3 + - 369.396 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 5888 + - - 10 + - 4360.42 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 5888 + - - 4 + - 3565.61 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1856 + - - 17 + - 4106.84 + - - - 128 + - 2368 + - 1 + - 128 + - 128 + - 128 + - 128 + - 2368 + - - 3 + - 449.459 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1408 + - - 18 + - 3990.43 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 2944 + - - 10 + - 4228.67 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 2368 + - - 4 + - 4100.37 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4288 + - - 18 + - 2549.15 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 
6784 + - 6784 + - 4288 + - - 17 + - 4221.65 + - - - 5888 + - 128 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 1 + - 888.624 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3584 + - - 4 + - 3882.04 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1856 + - - 4 + - 3463.89 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 448 + - 5056 + - - 18 + - 3625.35 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1856 + - - 18 + - 3275.04 + - - - 4 + - 3584 + - 1 + - 128 + - 4 + - 4 + - 4 + - 3584 + - - 24 + - 32.3068 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1408 + - - 31 + - 122.009 + - - - 256 + - 2368 + - 1 + - 128 + - 256 + - 256 + - 256 + - 2368 + - - 1 + - 732.025 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 2944 + - - 10 + - 4146.13 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 6784 + - - 10 + - 4364.3 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 128 + - 6784 + - - 18 + - 2542.29 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 64 + - 5056 + - - 7 + - 2282.44 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 5056 + - - 10 + - 4106.76 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 704 + - - 18 + - 3427.21 + - - - 2368 + - 4288 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 4288 + - - 1 + - 2346.73 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 4 + - 6784 + - - 29 + - 99.3538 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5888 + - - 18 + - 2693.16 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 448 + - - 4 + - 3668.9 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 448 + - - 4 + - 3601.24 + - - - 4 + - 704 + - 1 + - 128 + - 4 + - 4 + - 4 + - 704 + - - 25 + - 6.32815 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 1856 + - - 18 + - 4061.62 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 2944 + - - 4 + - 3714.63 + 
- - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 1408 + - - 10 + - 4141.17 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 1408 + - - 18 + - 3321.05 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 1024 + - - 13 + - 3807.84 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1024 + - - 18 + - 2378.06 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 5888 + - - 4 + - 3035.25 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 2368 + - - 10 + - 4106.78 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3584 + - - 17 + - 4111.9 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 2368 + - - 7 + - 4162.42 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 2944 + - - 7 + - 3682.23 + - - - 1024 + - 256 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 256 + - - 3 + - 397.188 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 2368 + - - 4 + - 3410.77 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 4 + - 4288 + - - 27 + - 158.022 + - - - 5056 + - 1408 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 1408 + - - 1 + - 2206.11 + - - - 1408 + - 64 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 64 + - - 3 + - 155.198 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 6784 + - - 10 + - 4326.23 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 4 + - - 28 + - 0.664939 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1408 + - - 7 + - 1959.72 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 1408 + - - 18 + - 3914.63 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1024 + - - 15 + - 1350.82 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1024 + - - 7 + - 2965.67 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 5888 + - - 7 + - 3203.15 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 3584 + - - 4 + - 3683.17 + - - - 4 + - 1408 + - 1 + 
- 768 + - 4 + - 4 + - 4 + - 1408 + - - 28 + - 64.3657 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 704 + - - 18 + - 3000.35 + - - - 1024 + - 128 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 3 + - 217.999 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 704 + - 448 + - - 7 + - 2231.22 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 448 + - - 4 + - 3661.0 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 128 + - - 7 + - 1524.35 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 256 + - 3584 + - - 4 + - 3395.54 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 448 + - 3584 + - - 18 + - 2731.54 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 256 + - - 18 + - 2832.88 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1856 + - - 7 + - 2300.2 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 2944 + - - 10 + - 4303.65 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1856 + - - 18 + - 3877.93 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 3584 + - - 10 + - 3871.18 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 2944 + - - 4 + - 3705.46 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 448 + - 128 + - - 7 + - 531.373 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 704 + - - 7 + - 3091.13 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 5056 + - - 27 + - 354.839 + - - - 64 + - 4 + - 1 + - 128 + - 64 + - 64 + - 64 + - 4 + - - 25 + - 0.615946 + - - - 5056 + - 448 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 448 + - - 1 + - 1577.08 + - - - 64 + - 5888 + - 1 + - 128 + - 64 + - 64 + - 64 + - 5888 + - - 3 + - 523.833 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 5056 + - - 17 + - 4123.63 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1024 + - - 17 + - 3604.78 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 704 + - - 
7 + - 2696.88 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1856 + - - 18 + - 4007.26 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 256 + - 256 + - - 4 + - 604.948 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1856 + - - 7 + - 2542.53 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 128 + - - 7 + - 2534.06 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 5056 + - - 17 + - 4106.94 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 4 + - - 30 + - 221.927 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 4 + - 1914.97 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 5888 + - - 18 + - 3954.83 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 128 + - - 7 + - 3874.94 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 64 + - - 9 + - 2566.05 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 2944 + - - 10 + - 4295.21 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 64 + - 5888 + - - 7 + - 2658.04 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 2944 + - - 18 + - 3684.16 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1408 + - - 18 + - 3964.21 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 18 + - 2981.91 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 448 + - - 16 + - 687.467 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 3584 + - - 20 + - 3467.39 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1408 + - - 18 + - 4066.8 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 256 + - - 4 + - 3403.34 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 2368 + - - 18 + - 3993.31 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 64 + - - 7 + - 1088.1 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 1024 + - - 13 + 
- 3701.79 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 3584 + - - 10 + - 4046.01 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1408 + - - 7 + - 2930.68 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 1408 + - - 18 + - 4185.7 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1408 + - - 18 + - 3911.48 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 2368 + - - 4 + - 3656.94 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 4288 + - - 17 + - 4350.7 + - - - 4288 + - 2368 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 2368 + - - 1 + - 2350.8 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 704 + - 4288 + - - 7 + - 3613.47 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 448 + - 1408 + - - 4 + - 1992.6 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 128 + - - 5 + - 1235.38 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 448 + - - 5 + - 751.612 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 4288 + - - 20 + - 4328.85 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 4 + - - 28 + - 182.754 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 3584 + - - 7 + - 3720.27 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 4 + - 448 + - - 30 + - 9.36993 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 448 + - 5888 + - - 18 + - 3352.28 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3584 + - - 20 + - 4163.88 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 4288 + - - 18 + - 3972.85 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 4 + - - 31 + - 48.6052 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 704 + - - 18 + - 3502.51 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 4 + - 448 + - - 28 + - 24.4364 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 448 + - - 7 + - 672.164 + - - - 1856 + - 448 + - 
1 + - 256 + - 1856 + - 1856 + - 1856 + - 448 + - - 18 + - 2538.89 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 5056 + - - 7 + - 2613.88 + - - - 4 + - 2944 + - 1 + - 128 + - 4 + - 4 + - 4 + - 2944 + - - 25 + - 26.8401 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 704 + - - 16 + - 603.621 + - - - 1856 + - 3584 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 3584 + - - 0 + - 2189.48 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 18 + - 2672.27 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 4 + - - 28 + - 84.4436 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 448 + - 4288 + - - 18 + - 3766.71 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 64 + - - 15 + - 1227.43 + - - - 704 + - 256 + - 1 + - 128 + - 704 + - 704 + - 704 + - 256 + - - 3 + - 302.262 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 4 + - - 28 + - 28.4941 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5056 + - - 18 + - 2927.12 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 704 + - - 18 + - 3988.26 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 64 + - - 19 + - 1144.93 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 4 + - - 27 + - 209.371 + - - - 64 + - 704 + - 1 + - 128 + - 64 + - 64 + - 64 + - 704 + - - 3 + - 69.7866 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 3584 + - - 17 + - 3866.47 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 704 + - - 4 + - 2153.94 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 128 + - - 16 + - 419.43 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 4288 + - - 4 + - 3776.96 + - - - 1408 + - 448 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 448 + - - 3 + - 856.026 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 1856 + - - 4 + - 3799.76 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 128 + - 2368 + - - 7 + - 2139.56 
+ - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1856 + - - 4 + - 3641.63 + - - - 2944 + - 2368 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 2368 + - - 1 + - 2182.4 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 64 + - 128 + - - 15 + - 51.7049 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 128 + - 64 + - - 14 + - 80.0847 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 6784 + - - 10 + - 4175.93 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 128 + - - 7 + - 747.648 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 1024 + - - 20 + - 4157.98 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 256 + - - 7 + - 1941.81 + - - - 1024 + - 4 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 4 + - - 25 + - 9.55344 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 2368 + - - 18 + - 4019.02 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1024 + - - 20 + - 3915.08 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 704 + - 448 + - - 15 + - 1635.74 + - - - 4 + - 4288 + - 1 + - 128 + - 4 + - 4 + - 4 + - 4288 + - - 25 + - 38.4362 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 2944 + - - 18 + - 3914.16 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 448 + - 4288 + - - 18 + - 3411.36 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 128 + - 1408 + - - 7 + - 1623.03 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 4 + - - 28 + - 92.8648 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 3584 + - - 10 + - 4087.28 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 4 + - - 28 + - 126.918 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 1408 + - - 4 + - 3333.04 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 5888 + - - 10 + - 4186.47 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1856 + - - 7 + - 3920.22 + - - - 1856 + - 3584 
+ - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 3584 + - - 10 + - 3797.02 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 448 + - - 4 + - 3698.96 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 4288 + - - 18 + - 3913.84 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 64 + - - 5 + - 635.551 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 128 + - - 7 + - 1843.83 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 1024 + - - 20 + - 3956.24 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 3584 + - - 4 + - 3815.84 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 4 + - - 28 + - 120.394 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 5888 + - - 4 + - 3142.02 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 704 + - - 20 + - 3754.17 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 4288 + - - 18 + - 4043.43 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 5056 + - - 18 + - 4118.79 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 5888 + - - 10 + - 4234.81 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 4 + - - 26 + - 89.7219 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 64 + - 2944 + - - 4 + - 1673.26 + - - - 256 + - 4288 + - 1 + - 128 + - 256 + - 256 + - 256 + - 4288 + - - 1 + - 1059.97 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 1024 + - - 18 + - 2901.72 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 5888 + - - 20 + - 4413.53 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 4 + - - 28 + - 180.727 + - - - 4288 + - 256 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 256 + - - 1 + - 1092.95 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 128 + - - 7 + - 2040.33 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 5056 + - - 10 + - 4265.22 + - - - 2944 + - 4288 + - 1 + - 
256 + - 2944 + - 2944 + - 2944 + - 4288 + - - 17 + - 4100.33 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 64 + - 3584 + - - 7 + - 1229.49 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 6784 + - - 10 + - 4374.0 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1408 + - - 7 + - 3717.89 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 1856 + - - 4 + - 4119.35 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 5056 + - - 18 + - 4069.48 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 64 + - - 15 + - 389.805 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 704 + - - 18 + - 3221.88 + - - - 3584 + - 2368 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 2368 + - - 0 + - 2305.45 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 6784 + - - 18 + - 4073.09 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 5888 + - - 20 + - 4158.91 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 128 + - - 18 + - 2277.36 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 5888 + - - 18 + - 3944.64 + - - - 256 + - 704 + - 1 + - 128 + - 256 + - 256 + - 256 + - 704 + - - 3 + - 295.752 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 4 + - 5888 + - - 27 + - 195.758 + - - - 1856 + - 5056 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 5056 + - - 0 + - 2302.46 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 2944 + - - 18 + - 3542.75 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 64 + - 256 + - - 7 + - 150.657 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1419.74 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 1024 + - - 18 + - 3710.99 + - - - 704 + - 5888 + - 1 + - 128 + - 704 + - 704 + - 704 + - 5888 + - - 1 + - 1948.37 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 2944 + - - 10 + - 4226.01 + - - - 2368 + - 64 + - 1 + - 3328 + 
- 2368 + - 2368 + - 2368 + - 64 + - - 9 + - 1970.18 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 6784 + - - 10 + - 4370.09 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 128 + - - 4 + - 2744.47 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1856 + - - 10 + - 4075.23 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 1856 + - - 4 + - 3598.24 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 64 + - - 7 + - 3009.28 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 4 + - - 28 + - 211.534 + - - - 5888 + - 64 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 64 + - - 3 + - 551.63 + - - - 128 + - 6784 + - 1 + - 128 + - 128 + - 128 + - 128 + - 6784 + - - 1 + - 998.823 + - - - 64 + - 2944 + - 1 + - 128 + - 64 + - 64 + - 64 + - 2944 + - - 3 + - 309.831 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 6784 + - - 10 + - 4276.65 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 4 + - - 28 + - 67.3416 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 1024 + - - 18 + - 3114.05 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 64 + - 4288 + - - 15 + - 1423.31 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 3584 + - - 7 + - 3652.59 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 1408 + - - 18 + - 3664.19 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 448 + - - 18 + - 3368.74 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 1408 + - - 18 + - 3186.28 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 448 + - 256 + - - 7 + - 1064.8 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4 + - - 31 + - 5.841 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 704 + - - 21 + - 3164.76 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 4288 + - - 17 + - 4291.33 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 64 
+ - - 15 + - 1405.09 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1856 + - - 7 + - 3677.4 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 4 + - - 28 + - 11.0818 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 3584 + - - 17 + - 4209.17 + - - - 2368 + - 256 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 256 + - - 3 + - 808.277 + - - - 1408 + - 128 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 3 + - 304.819 + - - - 448 + - 2368 + - 1 + - 128 + - 448 + - 448 + - 448 + - 2368 + - - 1 + - 1054.93 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 64 + - 5056 + - - 7 + - 1607.87 + - - - 3584 + - 1024 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 1024 + - - 0 + - 1824.74 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 704 + - - 4 + - 3776.44 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 4 + - - 28 + - 68.489 + - - - 256 + - 6784 + - 1 + - 128 + - 256 + - 256 + - 256 + - 6784 + - - 1 + - 1435.29 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1408 + - - 7 + - 3736.07 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 5888 + - - 17 + - 4115.57 + - - - 2368 + - 5056 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 5056 + - - 0 + - 2383.21 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 1024 + - - 4 + - 2242.02 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 128 + - - 19 + - 1111.51 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 2944 + - - 10 + - 3834.15 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 128 + - - 7 + - 3193.63 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 6784 + - - 10 + - 4178.48 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 128 + - - 7 + - 2794.79 + - - - 1408 + - 4288 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 4288 + - - 1 + - 2123.08 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 128 + - 256 + - - 7 + - 306.601 + - - - 
1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 15 + - 1296.54 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 448 + - - 18 + - 3357.61 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 2368 + - - 18 + - 4116.64 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 64 + - 2368 + - - 7 + - 1372.55 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 128 + - - 16 + - 761.11 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 6784 + - - 17 + - 4193.89 + - - - 2944 + - 6784 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 6784 + - - 0 + - 2565.87 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 704 + - 704 + - - 7 + - 1574.95 + - - - 5888 + - 4288 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 4288 + - - 0 + - 2655.04 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 6784 + - - 10 + - 4339.4 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 2368 + - - 18 + - 4127.46 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 64 + - - 7 + - 691.107 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2368 + - - 7 + - 1907.44 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 64 + - - 28 + - 10.779 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 4288 + - - 18 + - 3960.64 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 4288 + - - 9 + - 2403.45 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 64 + - 704 + - - 15 + - 277.268 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 2368 + - - 18 + - 3444.06 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 64 + - - 4 + - 2416.76 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 128 + - - 9 + - 2229.35 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 4288 + - - 18 + - 4119.95 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 448 + - 3584 + - - 7 + - 3376.58 + - - - 3584 + - 5056 + - 1 + - 256 + - 
3584 + - 3584 + - 3584 + - 5056 + - - 18 + - 4105.8 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 1408 + - - 9 + - 2152.55 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 4 + - - 28 + - 46.2985 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 256 + - 1856 + - - 4 + - 3310.09 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 704 + - - 18 + - 4066.38 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 448 + - - 4 + - 3161.54 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 1024 + - - 28 + - 133.853 + - - - 5056 + - 6784 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 6784 + - - 0 + - 2650.05 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 1408 + - - 18 + - 4011.33 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 64 + - - 14 + - 267.105 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 448 + - 5056 + - - 18 + - 3308.21 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 448 + - - 7 + - 3300.01 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 128 + - 4288 + - - 4 + - 2374.54 + - - - 64 + - 1856 + - 1 + - 128 + - 64 + - 64 + - 64 + - 1856 + - - 3 + - 200.903 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 448 + - 704 + - - 15 + - 1617.39 + - - - 1024 + - 704 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 704 + - - 1 + - 863.348 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 2368 + - - 18 + - 3858.51 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 448 + - - 4 + - 3970.16 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 18 + - 2595.94 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 3584 + - - 17 + - 4197.7 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 18 + - 2575.32 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 448 + - 2944 + - - 18 + - 3018.97 + - - - 704 + - 4 + - 1 + - 128 + - 704 + - 704 + - 704 + - 4 + - - 25 + - 
6.73489 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 6784 + - - 10 + - 4438.7 + - - - 3584 + - 64 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 64 + - - 3 + - 356.659 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 1856 + - - 18 + - 3839.48 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 128 + - - 7 + - 2082.79 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 448 + - - 18 + - 3786.05 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 3584 + - - 27 + - 230.861 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 448 + - 2368 + - - 7 + - 3014.0 + - - - 448 + - 128 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 3 + - 96.0737 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 64 + - 5888 + - - 7 + - 1838.2 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 5056 + - - 27 + - 281.204 + - - - 5888 + - 4 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 4 + - - 25 + - 53.3006 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 3584 + - - 20 + - 3925.59 + - - - 6784 + - 1856 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 1856 + - - 0 + - 2488.06 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 5056 + - - 4 + - 3864.28 + - - - 2368 + - 1408 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 1408 + - - 1 + - 1847.81 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 2944 + - - 18 + - 3837.0 + - - - 4 + - 5888 + - 1 + - 128 + - 4 + - 4 + - 4 + - 5888 + - - 25 + - 53.3006 + - - - 3584 + - 704 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 704 + - - 0 + - 1617.39 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 64 + - 6784 + - - 7 + - 2121.17 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 6784 + - - 10 + - 4184.16 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 5888 + - - 17 + - 4400.03 + - - - 5056 + - 1856 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 1856 + - - 0 + - 2343.06 + - - - 3584 + - 5056 + - 1 + - 768 + 
- 3584 + - 3584 + - 3584 + - 5056 + - - 10 + - 4207.39 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 4288 + - - 10 + - 4239.34 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 2368 + - - 18 + - 4166.18 + - - - 5056 + - 704 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 704 + - - 0 + - 1811.41 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 448 + - - 7 + - 2158.31 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 448 + - 6784 + - - 18 + - 3373.41 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 5888 + - - 4 + - 3950.3 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 4 + - - 28 + - 21.0051 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 3262.14 + - - - 704 + - 2944 + - 1 + - 128 + - 704 + - 704 + - 704 + - 2944 + - - 1 + - 1424.45 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 4 + - - 28 + - 104.639 + - - - 6784 + - 448 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 448 + - - 1 + - 1754.25 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1856 + - - 20 + - 4114.19 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 2368 + - - 17 + - 3927.57 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 2368 + - - 18 + - 4063.18 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 6784 + - - 20 + - 3960.15 +- null diff --git a/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml new file mode 100644 index 000000000..9b10ef812 --- /dev/null +++ b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml @@ -0,0 +1,18412 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + 
ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 64 + LSCB: 8 + LSPA: 4 + LSPB: 32 + LVCA: 16 + LVCB: 2 + LVPA: 
1 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 1024 + LdsOffsetA: 0 + LdsOffsetB: 512 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + 
TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x8_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 16 + LSPA: 8 + LSPB: 16 + LVCA: 8 + LVCB: 4 + LVPA: 2 + LVPB: 4 + LdcEqualsLdd: true + 
LdsNumElements: 2048 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + 
Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x32x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 8 + LSPA: 8 + LSPB: 32 + LVCA: 
8 + LVCB: 2 + LVPA: 2 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 1792 + LdsNumElementsAlignedA: 256 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 256 + LdsOffsetB_Blk: 1280 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + 
SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x64x8_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + 
KernelLanguage: Source + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: 
false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x128x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 
64 + LSCB: 8 + LSPA: 4 + LSPB: 32 + LVCA: 16 + LVCB: 2 + LVPA: 1 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 1792 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 256 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + 
SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x8_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + 
InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + 
SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU8_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + 
KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 
1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + 
ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 
+ NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x64x32_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 
+ GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 8 + LSPA: 2 + LSPB: 32 + LVCA: 128 + LVCB: 8 + LVPA: 2 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 
+ IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 8 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + 
GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 8 + LSPA: 4 + LSPB: 32 + LVCA: 64 + LVCB: 8 + LVPA: 4 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 
+ IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 9 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + 
GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + 
IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 10 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + 
GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 8 + LSPA: 8 + LSPB: 32 + LVCA: 32 + LVCB: 8 + LVPA: 8 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 256 + LdsNumElementsAlignedB: 256 + LdsOffsetA: 0 + LdsOffsetA_Blk: 512 + LdsOffsetB: 256 + LdsOffsetB_Blk: 768 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 
+ IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 11 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x32x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + 
GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + 
HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 12 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x128x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + 
GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 4 + LSPB: 16 + LVCA: 64 + LVCB: 16 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + 
ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 13 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x16_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + 
DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 8 + LSPA: 8 + LSPB: 64 + LVCA: 32 + LVCB: 4 + LVPA: 2 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: 
+ AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 14 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x64x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: 
false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + 
PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 15 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: 
true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 8 + LSPA: 8 + LSPB: 32 + LVCA: 32 + LVCB: 8 + LVPA: 8 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 256 + LdsNumElementsAlignedB: 256 + LdsOffsetA: 0 + LdsOffsetA_Blk: 512 + LdsOffsetB: 256 + LdsOffsetB_Blk: 768 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 
+ PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 16 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT32x32x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + 
BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 32 + LSPA: 16 + LSPB: 32 + LVCA: 16 + LVCB: 8 + LVPA: 4 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 
1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 17 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + 
AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 8 + LSPA: 8 + LSPB: 128 + LVCA: 32 + LVCB: 2 + LVPA: 2 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + 
PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 18 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x128x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + 
AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 8 + LSPA: 4 + LSPB: 32 + LVCA: 64 + LVCB: 8 + LVPA: 4 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 
+ OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 19 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + 
_staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 2 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 4 + LSPA: 4 + LSPB: 16 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + 
NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 20 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT16x16x4_SE_AMAS2_GRVW2_GSU1_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 8 + - 8 + - 1 + 
WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 4 + LSPA: 4 + LSPB: 16 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + 
NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 21 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT16x16x4_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + 
VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + 
NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 22 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 
1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + 
NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 23 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU4_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 
1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + 
NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 24 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU8_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + 
UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + 
NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 25 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + 
ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + 
MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 26 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + 
ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 39.3642 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4148.36 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4141.24 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4378.86 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 6 + - 2352.57 + - - - 256 + - 1856 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 566.059 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 6 + - 3523.35 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 3995.42 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4359.77 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4346.04 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 3978.89 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 3629.13 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3966.27 + - - - 448 + - 256 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 165.764 + - - - 4 + - 2944 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 27.2674 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 23 + - 99.9254 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 3976.72 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 3528.86 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 
24 + - 39.961 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 24 + - 93.5274 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 1106.68 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4171.94 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 3639.65 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1297.17 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 2622.29 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 65.341 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 6 + - 3218.49 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 18 + - 3755.41 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 495.056 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4461.2 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 14 + - 3094.35 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 4145.09 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3864.15 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 5 + - 249.844 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 16 + - 1329.78 + - - - 3584 + - 4 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 20 + - 32.3523 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 2345.97 + - - - 5888 + - 448 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 1423.93 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4439.33 + - - - 6784 + - 2368 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 2220.39 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 3947.86 + - - - 4 + - 448 + 
- 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 24.7172 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 2112.24 + - - - 1408 + - 1024 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1158.65 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 3849.86 + - - - 256 + - 6784 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 4 + - 1291.23 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 14 + - 3495.93 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 26 + - 101.342 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 6 + - 1271.77 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 3546.14 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3935.55 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 3944.24 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4127.22 + - - - 704 + - 128 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 132.884 + - - - 5056 + - 4 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 20 + - 45.1937 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 2893.12 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4278.74 + - - - 3584 + - 1024 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 0 + - 1605.26 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 23 + - 60.3621 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4178.75 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4276.36 + - - - 4288 + - 1024 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 3 + - 1766.53 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 21.3472 + - - - 128 + - 448 + - 1 + - 128 + - 128 + - 128 + - 128 
+ - 128 + - - 1 + - 84.6406 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4300.5 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4416.4 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 65.5694 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 19 + - 2812.03 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 22 + - 158.641 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4160.45 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 6 + - 3209.78 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 18 + - 3848.87 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3625.97 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 73.0438 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 3278.28 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4292.92 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 2943.86 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 3706.58 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 12 + - 3301.71 + - - - 1024 + - 3584 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 0 + - 1616.3 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 1495.38 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 3830.45 + - - - 4288 + - 6784 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2429.72 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 6 + - 1553.95 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 1775.29 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 26 + - 
9.55733 + - - - 6784 + - 4288 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 0 + - 2377.59 + - - - 1856 + - 128 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 1 + - 346.183 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 135.234 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4349.99 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 25 + - 151.063 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 3.21886 + - - - 128 + - 5056 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 704.401 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2829.71 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 3600.97 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 5 + - 408.618 + - - - 256 + - 704 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 258.154 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 18 + - 4157.3 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 23 + - 138.875 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4203.55 + - - - 704 + - 2944 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 1300.95 + - - - 1408 + - 4288 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1839.3 + - - - 448 + - 6784 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 0 + - 1549.64 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 0.0975238 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 13 + - 271.652 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4388.28 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 97.8807 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4382.68 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 
+ - - 14 + - 3797.64 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 3968.1 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 14 + - 3953.56 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 23 + - 114.655 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 6 + - 1781.3 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4428.42 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 6 + - 3798.7 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 14 + - 4183.52 + - - - 704 + - 4 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 20 + - 6.61621 + - - - 64 + - 64 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 2 + - 4.36035 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 80.2595 + - - - 1856 + - 704 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 4 + - 1114.99 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 3858.52 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 13 + - 732.876 + - - - 128 + - 128 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 26.5866 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 6 + - 2114.45 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 3203.57 + - - - 1408 + - 64 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 135.634 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 3906.42 + - - - 5888 + - 128 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 1 + - 889.935 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 3342.88 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4165.82 + - - - 5056 + - 1024 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 3 + - 1808.68 + - - - 448 + - 64 + - 1 + 
- 1792 + - 448 + - 448 + - 448 + - 1792 + - - 13 + - 450.388 + - - - 6784 + - 5888 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 0 + - 2462.27 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4447.72 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 563.751 + - - - 3584 + - 6784 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 0 + - 2150.84 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4496.73 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 3243.21 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 23 + - 210.041 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 18 + - 3774.26 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 3927.19 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 26 + - 181.189 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 4209.42 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 10 + - 3117.73 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 23 + - 157.418 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 16 + - 140.184 + - - - 128 + - 4288 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 578.894 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3493.17 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4340.86 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 26 + - 4.38075 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 10 + - 3334.59 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 6 + - 3135.25 + - - - 3584 + - 5056 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 0 + - 2084.49 + - - - 4288 + - 128 + - 1 + - 128 + - 
4288 + - 4288 + - 4288 + - 128 + - - 1 + - 655.849 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3755.13 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 516.771 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 2670.14 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 16 + - 1180.07 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4437.93 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 10 + - 3173.32 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3263.61 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 1769.85 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 202.038 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 6 + - 2413.33 + - - - 64 + - 448 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 41.9718 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 3835.24 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 13 + - 495.948 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 3972.23 + - - - 448 + - 1024 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 620.984 + - - - 4 + - 2368 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 21.9961 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 2690.8 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 3930.42 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 23 + - 248.798 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 18 + - 3950.24 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 3832.07 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 10 + - 
2942.24 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 4047.77 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 10 + - 3152.45 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 6 + - 3149.26 + - - - 1856 + - 5888 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 4 + - 2094.77 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 105.703 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 71.2817 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 3975.85 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 8 + - 2131.59 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 24 + - 7.86612 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4294.26 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 13 + - 961.688 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4222.89 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 3188.17 + - - - 4 + - 4288 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 39.487 + - - - 5888 + - 3584 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 2215.93 + - - - 2944 + - 1856 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 1801.47 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 10 + - 3608.14 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 3600.47 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 10 + - 3588.68 + - - - 2944 + - 5888 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2232.72 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 6 + - 3020.64 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 13 + - 393.292 + - - - 5056 + - 4 + - 1 
+ - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 23 + - 173.349 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 9 + - 1733.22 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 15 + - 1336.9 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 6 + - 2914.61 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 2076.84 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 2823.23 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4322.48 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 10 + - 2184.53 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 2915.69 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 10 + - 2959.69 + - - - 4288 + - 4288 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 2273.68 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4245.39 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 10.6603 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 2470.53 + - - - 64 + - 704 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 68.0091 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 2846.6 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4304.64 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 3915.62 + - - - 64 + - 1856 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 173.249 + - - - 1024 + - 2368 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1325.5 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 90.7877 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 6 + - 3329.39 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 
1792 + - - 6 + - 2678.84 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 3695.81 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 2688.39 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4392.89 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 6 + - 1744.98 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 17 + - 2494.4 + - - - 2368 + - 5056 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 2146.35 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4221.01 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 3916.54 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 976.068 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4392.5 + - - - 2368 + - 5888 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 2196.37 + - - - 448 + - 5888 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 3 + - 1587.85 + - - - 5888 + - 5056 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 0 + - 2304.61 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 3644.58 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 10 + - 3128.24 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 6 + - 1993.93 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 14 + - 3564.64 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 201.514 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 17.9797 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 3717.36 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4171.27 + - - - 4 + - 3584 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 
32.9566 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 3919.12 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 2831.87 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4244.99 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4410.19 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 10 + - 3108.37 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 2749.61 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 1240.16 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 1864.53 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 2205.8 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 3329.61 + - - - 1408 + - 3584 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1709.88 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 6 + - 2436.09 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4242.39 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4521.32 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 3915.63 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4461.97 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 2469.07 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 16 + - 998.273 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 11 + - 276.205 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 2617.02 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 6 + - 1499.64 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 4060.31 + - - - 
256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 657.709 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 15.0542 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 6 + - 2840.92 + - - - 6784 + - 64 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 1 + - 530.696 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 10 + - 3206.42 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4440.8 + - - - 3584 + - 448 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1272.42 + - - - 2944 + - 64 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 1 + - 266.077 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4151.19 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 2438.61 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 14 + - 3926.02 + - - - 128 + - 1024 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 192.223 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4295.68 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 10 + - 2676.72 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3552.7 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4144.37 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 4.25927 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4226.4 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 25 + - 50.5815 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 6 + - 3583.98 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 3932.54 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 3876.18 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 
+ - 4288 + - 4288 + - 768 + - - 14 + - 3975.39 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 22 + - 201.474 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4303.81 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 18 + - 3948.45 + - - - 2944 + - 1408 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 1626.35 + - - - 128 + - 1856 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 340.905 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 561.737 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3415.51 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 10 + - 2575.28 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 2747.73 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 6 + - 3696.24 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 3530.4 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4233.41 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 6 + - 1706.87 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 2627.96 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 3763.53 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 14 + - 3897.5 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 6 + - 1855.11 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4059.38 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 10 + - 3584.42 + - - - 4288 + - 1856 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 1994.62 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 12 + - 3890.5 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 
5888 + - 5888 + - 256 + - - 14 + - 4239.18 + - - - 1024 + - 64 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 1 + - 98.4578 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 3142.6 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 2056.9 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4506.24 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4184.67 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 11 + - 970.904 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 91.476 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3846.05 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 18 + - 3941.4 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 3595.46 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 2291.53 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4238.22 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 3586.47 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4354.21 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4417.73 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 6 + - 2720.28 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 6 + - 3541.9 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 6 + - 3540.4 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 14 + - 3855.64 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 6 + - 3623.32 + - - - 704 + - 1856 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 1113.8 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + 
- 2944 + - 768 + - - 14 + - 4235.17 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 17 + - 2476.9 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 2180.82 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 5 + - 418.915 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4489.82 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 3072.11 + - - - 2944 + - 128 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 1 + - 529.817 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 7.81431 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 13 + - 608.718 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 18 + - 4044.3 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 6 + - 3246.72 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4082.81 + - - - 64 + - 256 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 25.1578 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 5 + - 159.566 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 392.725 + - - - 1024 + - 1856 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1374.72 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 3578.29 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 23 + - 167.084 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 12 + - 3782.92 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 2953.84 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 11 + - 1221.3 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 24 + - 85.7646 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 14 + - 3822.29 + - - - 1408 + - 5888 
+ - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 14 + - 4035.35 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3622.28 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 105.703 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4212.77 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 4118.16 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4303.36 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 15 + - 1379.2 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 10 + - 2825.13 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 6 + - 3716.14 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 10 + - 2978.52 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 521.444 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 22 + - 66.9038 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 7 + - 2534.09 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 23 + - 69.0395 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 2226.06 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 10 + - 2539.8 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3202.47 + - - - 5056 + - 448 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 1 + - 1353.3 + - - - 1024 + - 5888 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1719.9 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 6 + - 1010.03 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 10 + - 3609.36 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 12 + - 3814.24 + - - - 256 + - 4288 + - 1 + - 128 + - 256 + - 256 
+ - 256 + - 128 + - - 1 + - 888.849 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4379.88 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 3514.27 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 79.771 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 5 + - 76.9503 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 92.4762 + - - - 128 + - 2368 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 420.978 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1999.08 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 45.9277 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 5 + - 94.588 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 3517.46 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4316.26 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4312.31 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4191.83 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 6 + - 3782.12 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 2849.78 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 3779.48 + - - - 4288 + - 5888 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2406.56 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4211.53 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 3569.22 + - - - 448 + - 1408 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 746.49 + - - - 6784 + - 1024 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 1923.0 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 8 + - 2457.45 + - - - 1856 + - 3584 + 
- 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3654.89 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 3772.87 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 2880.86 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4418.24 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 6 + - 1439.07 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4417.68 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 3951.13 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 16 + - 138.578 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 17 + - 2014.94 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 25 + - 25.2062 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 3597.68 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 3504.14 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 23 + - 41.3512 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 1284.63 + - - - 704 + - 5888 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 4 + - 1659.31 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 3887.89 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 81.5378 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 6 + - 3208.12 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4347.12 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4512.11 + - - - 448 + - 2368 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 939.337 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 11 + - 379.919 + - - - 704 + - 128 + - 1 + - 768 + - 704 + 
- 704 + - 704 + - 768 + - - 6 + - 775.852 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 16 + - 1058.47 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 3465.95 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 9.24903 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 492.84 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 6 + - 2224.25 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4385.55 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 16 + - 37.8092 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 10 + - 2250.46 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 10 + - 3429.53 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 13 + - 916.095 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 4265.58 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4450.36 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 14 + - 3615.24 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 3868.07 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 246.862 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3836.6 + - - - 5056 + - 1408 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 4 + - 1943.71 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 24 + - 21.0466 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4084.72 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4518.51 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 3336.42 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 9 + - 
1613.47 + - - - 1856 + - 1856 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 0 + - 1728.31 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 3295.03 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4397.48 + - - - 2944 + - 6784 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2257.53 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 3641.76 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4233.8 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 4194.07 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 11 + - 989.223 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 3771.56 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 1509.73 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4343.82 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 8 + - 2418.79 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 2832.56 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 6 + - 3533.44 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4380.48 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 777.945 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 14 + - 3929.17 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 6 + - 725.658 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3370.57 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 3903.04 + - - - 2368 + - 4288 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 2041.26 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + 
- - 14 + - 4414.07 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3757.27 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 3982.92 + - - - 2944 + - 448 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 1 + - 1108.91 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 15 + - 1124.25 + - - - 448 + - 704 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 443.433 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 25 + - 3.30323 + - - - 1408 + - 6784 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 2013.04 + - - - 256 + - 5888 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 4 + - 1154.49 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 3292.65 + - - - 256 + - 3584 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 958.229 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 3416.79 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 6 + - 3384.32 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 3973.34 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 6 + - 1933.44 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 2332.89 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4230.03 + - - - 5888 + - 2368 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 2132.33 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 6 + - 2615.92 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 14 + - 3438.0 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4243.46 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 23 + - 302.085 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 6 + - 1522.25 + - - - 
4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 121.538 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 3345.79 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 18 + - 3273.88 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 25 + - 307.163 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 3218.49 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 3510.95 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4268.16 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 13 + - 1152.42 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 26 + - 47.7204 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 23 + - 214.8 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 4060.66 + - - - 128 + - 2944 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 525.659 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 3013.8 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 15 + - 1432.97 + - - - 704 + - 1408 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 923.687 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 2731.29 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 3120.22 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4366.64 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 10 + - 2368.66 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4352.55 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 1004.69 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 6 + - 3286.94 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 
64 + - 256 + - - 25 + - 1.76172 + - - - 64 + - 1024 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 99.297 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 3319.88 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 24 + - 116.381 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 273.585 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 10 + - 2666.68 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 10 + - 2224.84 + - - - 1024 + - 448 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 1 + - 601.149 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 10 + - 3212.27 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 2181.4 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 1299.12 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 1908.98 + - - - 4288 + - 4 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 20 + - 38.7619 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 14 + - 3832.99 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 15 + - 1038.99 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 6 + - 2190.88 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 3432.84 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 3870.09 + - - - 2944 + - 2368 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 1884.48 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 3727.33 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4358.94 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 24 + - 10.9677 + - - - 5888 + - 704 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 1604.32 + - - 
- 448 + - 64 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 43.197 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 3534.46 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 6 + - 3293.39 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 10 + - 3103.89 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 23 + - 32.9956 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 2820.58 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4446.3 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 11 + - 344.926 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 11 + - 1547.79 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 6 + - 2000.91 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 3351.24 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4178.59 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3545.33 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4141.26 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4259.14 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 984.158 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 2913.52 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4297.31 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4477.42 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 67.2809 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 6 + - 3337.14 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 10 + - 3144.55 + - - - 1408 + - 1024 + - 1 
+ - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 10 + - 3098.55 + - - - 1024 + - 6784 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1787.25 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4349.64 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 10 + - 3313.18 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 10 + - 3425.19 + - - - 4288 + - 5056 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2329.32 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 9 + - 1266.43 + - - - 1856 + - 1408 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 1568.34 + - - - 256 + - 5056 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 4 + - 996.122 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 26 + - 202.288 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 6 + - 2826.71 + - - - 128 + - 4 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 20 + - 1.23189 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 14 + - 3633.59 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4358.39 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 18 + - 3731.07 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4024.81 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4372.03 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4060.18 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 10 + - 2647.14 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 18 + - 3947.28 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4492.65 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 18 + - 3960.85 + - - - 
5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4383.11 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 6 + - 2070.53 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 6 + - 3467.13 + - - - 4288 + - 2944 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 2180.76 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 4086.64 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 564.256 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3691.13 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 3987.26 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 9 + - 2531.63 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 3372.86 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 3945.45 + - - - 2944 + - 3584 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2092.22 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 1460.74 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 6 + - 1849.25 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 282.889 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4195.95 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 16 + - 814.654 + - - - 5888 + - 6784 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 0 + - 2353.9 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 2552.92 + - - - 64 + - 128 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 12.1814 + - - - 1856 + - 64 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 1 + - 168.637 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 979.146 + - - - 2368 + - 6784 + - 1 + 
- 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 4112.19 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 8 + - 3172.45 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 6 + - 1523.51 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 10 + - 2662.93 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 6 + - 1486.98 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 1708.47 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 22 + - 332.409 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 4138.04 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 2614.24 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 2441.02 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 4056.55 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 8 + - 3024.66 + - - - 4288 + - 448 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 1515.6 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 3160.85 + - - - 4 + - 5056 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 46.6264 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 12 + - 3921.5 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4348.85 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 3309.52 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4235.52 + - - - 128 + - 3584 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 539.708 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 24 + - 183.04 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 3464.05 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 
1024 + - 768 + - - 26 + - 48.6052 + - - - 5888 + - 2944 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 2187.64 + - - - 704 + - 4288 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 0 + - 1607.32 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 1706.16 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 22 + - 281.542 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 2316.59 + - - - 2944 + - 5056 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2208.65 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4499.82 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3518.86 + - - - 1408 + - 5056 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1909.5 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 1775.3 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4379.72 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4407.8 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 12 + - 4012.21 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 3513.99 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3831.94 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 10 + - 3301.36 + - - - 704 + - 1024 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 848.113 + - - - 2944 + - 704 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 1 + - 1280.36 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 1559.3 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 10 + - 3462.9 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 5.68889 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 10 + - 3289.3 + 
- - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4329.8 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 12 + - 3275.05 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4383.11 + - - - 256 + - 2368 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 664.793 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 4146.56 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4314.91 + - - - 4288 + - 2368 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 3 + - 2044.34 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4227.47 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4017.22 + - - - 5056 + - 3584 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 4 + - 2242.14 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4308.74 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 2379.99 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4227.82 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 3798.69 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 0.668277 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 3510.93 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 6 + - 3448.82 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 6 + - 2370.69 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 24 + - 155.855 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 6 + - 2857.03 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 10 + - 2655.11 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 6 + - 2818.45 + - - - 2944 + - 
5888 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4213.1 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 83.6475 + - - - 6784 + - 128 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 1 + - 1004.6 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 2831.61 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4297.78 + - - - 1024 + - 1408 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1159.23 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 23 + - 185.328 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4432.48 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 386.928 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4289.42 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 24 + - 99.6136 + - - - 4 + - 448 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 3.9385 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4357.62 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4357.97 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 24.487 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 10 + - 3368.68 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 3911.17 + - - - 4288 + - 704 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 1564.63 + - - - 2368 + - 2944 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 1937.85 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 6 + - 668.03 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 18 + - 4099.15 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 26 + - 13.8209 + - - - 64 + - 4 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + 
- - 20 + - 0.605028 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4208.25 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 10 + - 3571.36 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 10 + - 3114.19 + - - - 5888 + - 256 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 1215.59 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 6 + - 3113.73 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 10 + - 2792.9 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 3333.13 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 10 + - 2753.42 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4383.9 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 153.553 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 205.201 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 10 + - 2245.55 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 3384.11 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4458.04 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4394.43 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 14 + - 3195.11 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 12 + - 4090.84 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 2964.02 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 774.463 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4395.23 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 3946.17 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 
4313.43 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 66.8912 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4439.79 + - - - 2944 + - 256 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 1 + - 873.813 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 10 + - 2834.46 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 5 + - 168.969 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 178.305 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 3954.41 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 6 + - 3263.15 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 2851.29 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 13 + - 1168.22 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 3669.02 + - - - 448 + - 3584 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 4 + - 1312.06 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 3304.19 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 3435.51 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 4133.74 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 6 + - 1745.1 + - - - 3584 + - 2368 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1889.39 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4354.77 + - - - 448 + - 4 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 20 + - 4.29226 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 10 + - 3408.71 + - - - 5056 + - 5056 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2404.96 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 26 + - 70.9441 + - - - 4 + - 1408 + - 1 
+ - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 12.1774 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 14 + - 3925.26 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 2570.26 + - - - 5888 + - 1856 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 2049.11 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4390.38 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 6 + - 2155.66 + - - - 4 + - 4 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 21 + - 0.0286676 + - - - 2944 + - 4288 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2134.89 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 3803.64 + - - - 1024 + - 1024 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 866.144 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 3725.14 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4372.9 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 13 + - 260.47 + - - - 5888 + - 4288 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 2264.76 + - - - 64 + - 6784 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 585.735 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 3992.08 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4478.82 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 6 + - 1015.04 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 18 + - 3701.94 + - - - 256 + - 256 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 95.8479 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3589.75 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 51.3002 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 
6784 + - 1792 + - - 14 + - 4544.89 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1747.63 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 27.9046 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 31.9312 + - - - 6784 + - 3584 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 2316.02 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 17 + - 2145.24 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 24 + - 28.672 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 3364.63 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4476.55 + - - - 4 + - 128 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 1.17197 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4269.62 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 2314.09 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 14 + - 4220.95 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 26 + - 183.585 + - - - 704 + - 448 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 453.801 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 6 + - 3807.34 + - - - 2368 + - 4 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 20 + - 21.4361 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3895.64 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4287.55 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 6 + - 1927.9 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4029.73 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 6 + - 3801.8 + - - - 6784 + - 1856 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 2147.51 + - - - 448 + - 
1024 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 2959.69 + - - - 128 + - 1408 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 260.722 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4279.73 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 3520.08 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4034.92 + - - - 3584 + - 1408 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1650.46 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 10 + - 3602.35 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 1765.2 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3762.52 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 13 + - 485.773 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 19.9805 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4093.62 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 139.81 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 26 + - 25.0047 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 10 + - 2779.78 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 10 + - 3147.42 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4448.59 + - - - 4 + - 5888 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 53.8336 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4298.85 + - - - 6784 + - 2944 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 2288.9 + - - - 4288 + - 64 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 1 + - 374.013 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 11 + - 354.249 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + 
- 768 + - - 6 + - 1932.76 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 5 + - 82.957 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 6 + - 2049.21 + - - - 704 + - 256 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 255.864 + - - - 4 + - 6784 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 62.3822 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 4453.78 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 11 + - 1083.06 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4460.72 + - - - 6784 + - 5056 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 0 + - 2412.2 + - - - 128 + - 256 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 50.607 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 3608.74 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 10 + - 2333.17 + - - - 4 + - 704 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 6.29279 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3919.53 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 2805.59 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3345.29 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 3891.09 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 3841.0 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3679.21 + - - - 4 + - 1856 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 17.1407 + - - - 5056 + - 64 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 1 + - 450.204 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4414.96 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 3354.1 + - - - 5888 + - 4288 + 
- 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4308.95 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 6 + - 2213.15 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 23 + - 197.314 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 3458.02 + - - - 1856 + - 6784 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 2166.45 + - - - 1408 + - 1408 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 1265.74 + - - - 3584 + - 2944 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1982.16 + - - - 1856 + - 448 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 1 + - 964.743 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 278.137 + - - - 1408 + - 1856 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 3 + - 1469.15 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 101.606 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 26 + - 68.2667 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 10 + - 3113.41 + - - - 128 + - 5888 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 793.331 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 6 + - 2241.21 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 24 + - 7.96629 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2855.9 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 6 + - 646.13 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4456.48 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4314.93 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 5 + - 254.889 + - - - 6784 + - 256 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 1367.48 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 
+ - - 14 + - 4163.56 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 3653.53 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 23 + - 277.644 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 3905.3 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 1652.45 + - - - 1024 + - 2944 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 0 + - 1452.41 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 3824.23 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1529.5 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 4256.23 + - - - 256 + - 128 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 49.9322 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 23 + - 257.251 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 18 + - 3784.77 + - - - 448 + - 5056 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 3 + - 1384.85 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 1771.4 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4354.88 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 26 + - 0.258586 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4149.36 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4395.04 + - - - 4288 + - 256 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 1 + - 980.662 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 8 + - 2825.48 + - - - 1856 + - 2368 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 1764.62 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 25 + - 78.2549 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 4169.52 + - - 
- 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4196.45 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 3941.37 + - - - 2368 + - 1408 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 0 + - 1673.87 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 6 + - 511.274 + - - - 3584 + - 128 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 1 + - 617.328 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 24 + - 46.8935 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 1972.32 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 18 + - 4166.15 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 10 + - 2258.17 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4055.05 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 976.068 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 18 + - 3907.96 + - - - 64 + - 1408 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 136.018 + - - - 3584 + - 1856 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1802.99 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 656.492 + - - - 2368 + - 1024 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 1 + - 1443.35 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1011.63 + - - - 5056 + - 1856 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 3 + - 2068.94 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3057.03 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 1988.12 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 1958.09 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 3729.29 + - - - 448 + - 3584 + - 1 + - 256 + 
- 448 + - 448 + - 448 + - 256 + - - 12 + - 2827.75 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 1698.61 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 3081.05 + - - - 1024 + - 256 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 1 + - 368.568 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 2212.84 + - - - 5056 + - 256 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 1 + - 1105.09 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 4307.17 + - - - 1024 + - 704 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 1 + - 809.427 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 4089.26 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 3964.03 + - - - 5888 + - 1408 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 1889.8 + - - - 4 + - 1024 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 9.08968 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 1497.47 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 2887.39 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 14 + - 4313.99 + - - - 128 + - 6784 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 888.908 + - - - 1024 + - 4288 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1607.29 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4430.95 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4252.68 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4440.61 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 0.483019 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 13.5303 + - - - 3584 + - 256 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 1 + - 
987.227 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 14 + - 4301.25 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3912.25 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 14.2824 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 16 + - 1083.47 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 6 + - 2802.5 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 1832.62 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4445.82 + - - - 3584 + - 704 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 1380.18 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 14 + - 3960.92 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 3928.11 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 24 + - 40.6862 + - - - 2944 + - 2944 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 4 + - 2020.32 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 3316.93 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 10 + - 2537.65 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 4173.27 + - - - 128 + - 704 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 135.38 + - - - 2368 + - 6784 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 2227.32 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 1932.76 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4441.69 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 6 + - 1176.29 + - - - 2368 + - 2368 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 3 + - 1908.91 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4281.09 + - - - 
704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 2028.1 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 14 + - 3775.18 + - - - 448 + - 128 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 85.1117 + - - - 1408 + - 704 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 911.478 + - - - 2368 + - 1856 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 3 + - 1764.18 + - - - 5888 + - 1024 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 4 + - 1792.11 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 22 + - 256.1 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 1838.74 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4370.84 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 819.2 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 6 + - 2963.69 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 2056.9 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 13 + - 799.97 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 3430.3 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 26 + - 83.6489 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4444.3 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 15 + - 988.864 + - - - 6784 + - 1408 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 2051.69 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 35.4772 + - - - 448 + - 4288 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 2 + - 1480.56 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4492.91 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 10 + - 2803.87 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 4 + - 
768 + - - 23 + - 134.269 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 2944 + - 1792 + - - 6 + - 3721.65 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 18 + - 3981.68 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 10 + - 3129.06 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 1106.68 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 18 + - 4021.73 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4307.56 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 2626.56 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 9 + - 2005.7 + - - - 1408 + - 448 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 728.704 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 13 + - 678.473 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 3732.64 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4035.28 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 10 + - 3034.65 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 3625.11 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 24 + - 122.613 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2306.69 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 10 + - 3392.45 + - - - 5888 + - 64 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 1 + - 519.768 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 14 + - 2709.8 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4325.34 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 6 + - 2427.83 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 
+ - - 6 + - 1490.22 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4534.05 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 17 + - 2087.38 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 25 + - 88.9804 + - - - 3584 + - 5888 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 0 + - 2139.28 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4150.99 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 6 + - 3352.28 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 1266.23 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 3931.0 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 2301.23 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4183.12 + - - - 5056 + - 2944 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 4 + - 2225.15 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 24 + - 18.6447 + - - - 256 + - 64 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 26.7494 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4295.19 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 14 + - 3312.0 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 7 + - 2780.79 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 2825.6 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3471.1 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 10 + - 2493.68 + - - - 1024 + - 128 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 1 + - 186.912 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4312.34 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 728.178 + 
- - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 26 + - 15.3121 + - - - 64 + - 4288 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 388.233 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 16 + - 753.597 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4163.76 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4480.35 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 6 + - 2108.9 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4219.49 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 3246.18 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 6784 + - 1792 + - - 14 + - 4540.43 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4088.55 + - - - 3584 + - 64 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 1 + - 319.967 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4199.65 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 10 + - 2869.86 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 8 + - 2569.23 + - - - 5056 + - 5888 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2436.65 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 14 + - 3172.63 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 13 + - 433.369 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 24 + - 14.8176 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 23 + - 239.083 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 4288 + - 1792 + - - 14 + - 4220.07 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4165.0 + - - - 3584 + - 3584 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 4 + - 2017.09 + - - - 1856 + - 1024 + 
- 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4106.91 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 24 + - 103.448 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4209.47 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 8 + - 2297.52 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 4173.01 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 6 + - 3598.39 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 8 + - 2802.21 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 9 + - 2058.01 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 3766.7 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 6 + - 2342.79 + - - - 2944 + - 4 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 20 + - 26.8019 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 1499.26 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 3399.41 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 6 + - 3105.04 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 1900.95 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 13 + - 267.105 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 23 + - 191.447 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 14 + - 4178.89 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 9 + - 1808.54 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 10 + - 3175.71 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 1299.12 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 24 + - 5.82025 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 
+ - 5056 + - 5056 + - 256 + - - 14 + - 4199.28 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 26 + - 60.1415 + - - - 4288 + - 3584 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 0 + - 2240.67 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 3319.92 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 10 + - 2378.29 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 3958.12 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4533.49 + - - - 4 + - 256 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 20 + - 2.25677 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 3917.77 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 1836.6 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 14 + - 4457.63 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 6 + - 3073.66 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 3396.29 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 26 + - 69.3016 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 14 + - 3889.77 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 11 + - 1297.17 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 14 + - 3291.5 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 18 + - 3749.64 + - - - 5056 + - 4288 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2339.69 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 3421.93 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4168.41 + - - - 1856 + - 4 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 20 + - 16.8251 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - 
- 14 + - 3703.02 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 4051.52 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4211.71 + - - - 2368 + - 3584 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 2058.06 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 47.943 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 52.6394 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 5 + - 142.948 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 14 + - 4154.15 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4447.42 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 6 + - 2466.98 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 6 + - 2943.86 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4130.78 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 8 + - 2488.48 + - - - 704 + - 5056 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 0 + - 1731.03 + - - - 256 + - 2944 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 804.982 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 14 + - 4066.5 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 11 + - 521.444 + - - - 2368 + - 448 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 912.571 + - - - 64 + - 3584 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 327.973 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4466.21 + - - - 2368 + - 64 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 1 + - 217.474 + - - - 4288 + - 1408 + - 1 + - 128 + - 4288 + - 4288 + - 4288 + - 128 + - - 4 + - 1854.49 + - - - 5888 + - 4 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 20 + - 53.1503 + - - - 128 + - 2944 
+ - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 2861.67 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 6 + - 1176.29 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 777.246 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4483.23 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 4207.54 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4421.63 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 2912.71 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 2789.1 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 6 + - 3469.83 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 18 + - 3711.42 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2200.82 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 14 + - 4071.47 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4272.71 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 246.862 + - - - 64 + - 5888 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 523.833 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 24 + - 7.81253 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 10 + - 2222.79 + - - - 2368 + - 128 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 1 + - 432.619 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 2770.63 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 4407.1 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 14 + - 3801.9 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 14 + - 3955.03 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 
+ - 1408 + - 3328 + - - 6 + - 3800.56 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 6 + - 2899.89 + - - - 6784 + - 704 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 4 + - 1808.64 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 3895.38 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 14 + - 3749.73 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 3850.02 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 3806.86 + - - - 1408 + - 256 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 505.449 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 4288 + - 256 + - - 14 + - 3583.09 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 448 + - 256 + - - 11 + - 178.851 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 13 + - 784.191 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3400.28 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 2368 + - 768 + - - 6 + - 1971.41 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 3965.04 + - - - 256 + - 4 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 20 + - 2.47121 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 448 + - 768 + - - 6 + - 3393.15 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 9 + - 1602.79 + - - - 1408 + - 2944 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1667.23 + - - - 1024 + - 5056 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 4 + - 1646.22 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 8 + - 2677.23 + - - - 1856 + - 2944 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 1884.97 + - - - 256 + - 448 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 169.125 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 
+ - - 14 + - 3705.11 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 256 + - 768 + - - 14 + - 3600.94 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 2944 + - 256 + - - 6 + - 1677.14 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 4 + - 768 + - - 24 + - 64.9846 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 64 + - 1792 + - - 16 + - 1013.31 + - - - 64 + - 2368 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 218.848 + - - - 1856 + - 4288 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 4 + - 1990.26 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 3422.2 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 6 + - 3725.08 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 3267.57 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 14 + - 3824.17 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 14 + - 4148.08 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 13 + - 665.6 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3676.17 + - - - 5056 + - 704 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 1751.25 + - - - 5888 + - 5888 + - 1 + - 128 + - 5888 + - 5888 + - 5888 + - 128 + - - 0 + - 2312.49 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 5056 + - 256 + - - 10 + - 3128.3 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1856 + - 1792 + - - 14 + - 4134.28 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 14 + - 4507.56 + - - - 256 + - 1408 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 495.036 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 25 + - 1.64498 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 6 + - 2790.75 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 18 + - 4096.69 + - - - 1024 + - 64 + - 1 + 
- 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 16 + - 759.445 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 448 + - 1792 + - - 9 + - 1168.26 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 3298.79 + - - - 6784 + - 448 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 0 + - 1497.16 + - - - 1856 + - 1024 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 2 + - 1474.0 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4511.54 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1024 + - 1792 + - - 6 + - 2968.67 + - - - 448 + - 448 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 295.969 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 14 + - 3635.77 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2726.43 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 2913.74 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 10 + - 3065.9 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 18 + - 4020.09 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4397.37 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 2915.15 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 2368 + - 256 + - - 11 + - 831.846 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 9 + - 1522.22 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 387.926 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 1408 + - 256 + - - 14 + - 3371.93 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3584 + - 3328 + - - 14 + - 3852.75 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 5056 + - 768 + - - 14 + - 4404.62 + - - - 1408 + - 2368 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 0 + - 1577.36 + - - - 1856 + - 128 + - 1 + - 1792 + - 
1856 + - 1856 + - 1856 + - 1792 + - - 6 + - 2302.69 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 13 + - 771.012 + - - - 64 + - 5056 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 444.026 + - - - 6784 + - 6784 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 0 + - 2506.43 + - - - 448 + - 1856 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 1 + - 953.678 + - - - 2944 + - 1024 + - 1 + - 128 + - 2944 + - 2944 + - 2944 + - 128 + - - 0 + - 1500.76 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4503.58 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 14 + - 3605.13 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 3689.58 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 14 + - 3359.31 + - - - 704 + - 704 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 653.201 + - - - 1408 + - 128 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 1 + - 257.463 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 5056 + - 1792 + - - 14 + - 4280.89 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 98.3595 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 4264.67 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 14 + - 3619.73 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 3584 + - 768 + - - 14 + - 3742.02 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 704 + - 1792 + - - 13 + - 645.303 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4554.14 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 1408 + - 768 + - - 14 + - 4286.55 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 5056 + - 3328 + - - 14 + - 3949.42 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 1856 + - 768 + - - 6 + - 3040.87 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 
448 + - 3328 + - - 8 + - 2484.44 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 128 + - 1792 + - - 6 + - 2436.49 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 6784 + - 3328 + - - 14 + - 4556.72 + - - - 448 + - 2944 + - 1 + - 128 + - 448 + - 448 + - 448 + - 128 + - - 4 + - 1104.27 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 24 + - 135.664 + - - - 128 + - 64 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 1 + - 13.2262 + - - - 1856 + - 256 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 1 + - 638.302 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 64 + - 3328 + - - 9 + - 1668.76 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 1024 + - 256 + - - 11 + - 1269.08 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 4288 + - 768 + - - 6 + - 3324.54 + - - - 64 + - 2944 + - 1 + - 128 + - 64 + - 64 + - 64 + - 128 + - - 1 + - 269.166 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 17 + - 1424.77 + - - - 5056 + - 2368 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 4 + - 2156.26 + - - - 704 + - 6784 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 3 + - 1897.57 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 2944 + - 3328 + - - 14 + - 4408.12 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 6 + - 3113.73 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 6 + - 3208.42 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 1980.24 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 256 + - 1792 + - - 14 + - 3777.28 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 17 + - 1978.71 + - - - 3584 + - 4288 + - 1 + - 128 + - 3584 + - 3584 + - 3584 + - 128 + - - 0 + - 2061.81 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 256 + - 3328 + - - 15 + - 1569.93 + - - - 1408 + - 4 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 20 + - 
13.0033 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 1024 + - 768 + - - 14 + - 3569.76 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1408 + - 1792 + - - 6 + - 3289.18 + - - - 5056 + - 6784 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 0 + - 2459.99 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 64 + - 768 + - - 6 + - 2080.65 + - - - 1024 + - 4 + - 1 + - 128 + - 1024 + - 1024 + - 1024 + - 128 + - - 20 + - 9.49806 + - - - 256 + - 1024 + - 1 + - 128 + - 256 + - 256 + - 256 + - 128 + - - 1 + - 377.525 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 5888 + - 3328 + - - 22 + - 302.117 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 6 + - 1966.08 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 1724.12 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 4 + - 256 + - - 23 + - 56.5662 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 6 + - 385.85 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 8 + - 2833.99 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 5888 + - 256 + - - 14 + - 4291.71 + - - - 1856 + - 5056 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 4 + - 2068.94 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4183.09 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 6784 + - 256 + - - 10 + - 3156.62 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4256.21 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 4288 + - 3328 + - - 14 + - 4363.46 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 448 + - 3328 + - - 24 + - 66.5006 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3583.54 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 128 + - 768 + - - 10 + - 2659.99 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 1408 + - 3328 + - - 14 + - 4152.69 + - - - 5888 + - 
2944 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4389.23 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 3584 + - 256 + - - 6 + - 1981.12 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 6784 + - 768 + - - 6 + - 2786.16 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 704 + - 768 + - - 24 + - 36.6806 + - - - 6784 + - 4 + - 1 + - 128 + - 6784 + - 6784 + - 6784 + - 128 + - - 20 + - 61.2383 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 128 + - 256 + - - 6 + - 1775.94 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 2944 + - 768 + - - 6 + - 3320.03 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 704 + - 3328 + - - 6 + - 3808.1 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 1856 + - 256 + - - 6 + - 1224.18 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 5888 + - 768 + - - 14 + - 4433.08 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 14 + - 2913.51 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 3584 + - 1792 + - - 6 + - 3431.07 + - - - 4 + - 64 + - 1 + - 128 + - 4 + - 4 + - 4 + - 128 + - - 21 + - 0.472983 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 3948.3 + - - - 2368 + - 704 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 4 + - 1356.72 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 2368 + - 1792 + - - 14 + - 4348.69 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 128 + - 3328 + - - 9 + - 2017.03 + - - - 704 + - 3584 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 3 + - 1504.1 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 64 + - 256 + - - 11 + - 177.467 + - - - 1408 + - 5888 + - 1 + - 128 + - 1408 + - 1408 + - 1408 + - 128 + - - 4 + - 1931.63 + - - - 1856 + - 3584 + - 1 + - 128 + - 1856 + - 1856 + - 1856 + - 128 + - - 3 + - 1990.85 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 4 + - 3328 + - - 24 + - 211.1 + - - - 704 + - 2368 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 
+ - - 2 + - 1329.01 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 5888 + - 1792 + - - 14 + - 4213.24 + - - - 704 + - 64 + - 1 + - 128 + - 704 + - 704 + - 704 + - 128 + - - 1 + - 66.3198 + - - - 2368 + - 256 + - 1 + - 128 + - 2368 + - 2368 + - 2368 + - 128 + - - 1 + - 724.912 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 2368 + - 3328 + - - 14 + - 3940.44 + - - - 5056 + - 128 + - 1 + - 128 + - 5056 + - 5056 + - 5056 + - 128 + - - 1 + - 767.014 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 4 + - 1792 + - - 26 + - 179.961 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 10 + - 3107.11 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 1856 + - 3328 + - - 24 + - 211.533 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 704 + - 256 + - - 6 + - 2182.47 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 1024 + - 3328 + - - 6 + - 3459.77 +- null diff --git a/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml new file mode 100644 index 000000000..1503da0de --- /dev/null +++ b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml @@ -0,0 +1,19013 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + 
OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 64 + LSPA: 16 + LSPB: 4 + LVCA: 4 + LVCB: 16 + LVPA: 4 + LVPB: 1 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + 
MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 4 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 4 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + 
ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 16 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 2048 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + 
MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x128x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 
+ ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 32 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 32 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + 
NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 4 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 4 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x32x32_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + 
ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 2048 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 
+ NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x64x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + 
UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 16 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + 
NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x128x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + 
UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 64 + LSPA: 32 + LSPB: 4 + LVCA: 8 + LVCB: 64 + LVPA: 32 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 
0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + 
ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + 
MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: 
false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 128 + LSPA: 32 + LSPB: 2 + LVCA: 8 + LVCB: 128 + LVPA: 32 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + 
MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 
+ SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + 
MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 8 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 
+ SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 16 + LSPB: 4 + LVCA: 16 + LVCB: 64 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + 
MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 9 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x64x16_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + 
SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 128 + LSPA: 32 + LSPB: 2 + LVCA: 8 + LVCB: 128 + LVPA: 32 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: 
true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 10 + SolutionNameMin: 
Cijk_Alik_Bjlk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 8 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + 
LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + 
ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 11 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x64x32_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + 
LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] 
+ ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 12 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + 
LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + 
TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 13 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x32x32_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 32 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + 
LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + 
TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 14 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x128x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 64 + LSPA: 32 + LSPB: 4 + LVCA: 8 + LVCB: 64 + LVPA: 32 + LVPB: 
4 + LdcEqualsLdd: true + LdsNumElements: 2048 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + 
TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 15 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 128 
+ LSPA: 128 + LSPB: 8 + LVCA: 2 + LVCB: 32 + LVPA: 32 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + 
SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 16 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x128x8_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 
8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 32 + LSPA: 16 + LSPB: 8 + LVCA: 16 + LVCB: 32 + LVPA: 16 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + 
NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 17 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x32x16_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: 
true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + 
- 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 18 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + 
GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + 
NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 19 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU8_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 4 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + 
GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 64 + LSPA: 32 + LSPB: 4 + LVCA: 8 + LVCB: 64 + LVPA: 32 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + 
IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 20 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + 
GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 32 + LSPB: 16 + LVCA: 8 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + 
- 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 21 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT32x64x16_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + 
GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 2 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 4 + LSCB: 16 + LSPA: 16 + LSPB: 4 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + 
IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 22 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT16x16x4_SE_AMAS2_GRVW2_GSU1_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + 
GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 4 + LSCB: 16 + LSPA: 16 + LSPB: 4 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 
+ Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 23 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT16x16x4_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + 
GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: 
false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 24 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + 
GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + 
HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 25 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU4_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 
+ GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + 
DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 26 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU8_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + 
GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + 
ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 27 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU2_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 
+ GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + 
ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 28 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true 
+ FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + 
ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 29 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 4288 + - - 10 + - 2978.45 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 2944 + - - 14 + - 3351.31 + - - - 448 + - 2944 + - 1 + - 128 + - 448 + - 448 + - 128 + - 2944 + - - 3 + - 1047.28 + - - - 1024 + - 2368 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 2368 + - - 4 + - 1270.79 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 2944 + - - 14 + - 
4391.66 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 704 + - - 8 + - 938.841 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 128 + - - 9 + - 768.705 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 704 + - - 21 + - 1992.91 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 4 + - 256 + - 1024 + - - 25 + - 18.2044 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 5056 + - - 14 + - 3915.61 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 448 + - - 14 + - 2941.67 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 64 + - - 12 + - 1738.99 + - - - 128 + - 5056 + - 1 + - 128 + - 128 + - 128 + - 128 + - 5056 + - - 2 + - 695.88 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 704 + - - 14 + - 2849.99 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 5056 + - - 14 + - 4258.78 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 256 + - - 10 + - 3059.35 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1856 + - - 6 + - 3115.65 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 4288 + - - 14 + - 4273.47 + - - - 6784 + - 256 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 256 + - - 3 + - 1268.25 + - - - 704 + - 256 + - 1 + - 128 + - 704 + - 704 + - 128 + - 256 + - - 2 + - 261.668 + - - - 4288 + - 4 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 4 + - - 22 + - 39.5439 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 704 + - - 6 + - 3061.04 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 768 + - 2368 + - - 6 + - 2753.26 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1856 + - - 18 + - 4110.42 + - - - 5056 + - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 3584 + - - 14 + - 4400.95 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 17 + - 106.998 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 6784 + - - 14 + - 3002.41 + - - - 448 + - 5056 + - 1 + 
- 3328 + - 448 + - 448 + - 3328 + - 5056 + - - 6 + - 3570.58 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 5056 + - - 16 + - 4197.09 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1024 + - - 14 + - 3594.01 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 6784 + - - 14 + - 4354.86 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3584 + - - 6 + - 3619.9 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 5056 + - - 14 + - 4282.46 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 128 + - - 21 + - 2379.11 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 3584 + - - 14 + - 4292.05 + - - - 1408 + - 2944 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 2944 + - - 3 + - 1549.95 + - - - 448 + - 3584 + - 1 + - 128 + - 448 + - 448 + - 128 + - 3584 + - - 3 + - 1223.34 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 3584 + - - 14 + - 3468.97 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 2368 + - - 14 + - 4166.69 + - - - 704 + - 3584 + - 1 + - 128 + - 704 + - 704 + - 128 + - 3584 + - - 3 + - 1473.9 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 4288 + - - 14 + - 3919.7 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 2944 + - - 14 + - 3916.51 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3584 + - - 21 + - 2317.16 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 5056 + - - 10 + - 2539.35 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 5888 + - - 14 + - 4367.11 + - - - 5888 + - 704 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 704 + - - 3 + - 1378.85 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 5056 + - - 14 + - 3992.59 + - - - 128 + - 2368 + - 1 + - 128 + - 128 + - 128 + - 128 + - 2368 + - - 2 + - 396.538 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 448 + - - 6 + - 3140.27 + - - - 256 + - 1024 + - 
1 + - 256 + - 256 + - 256 + - 256 + - 1024 + - - 6 + - 1294.54 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1024 + - - 12 + - 2635.54 + - - - 5056 + - 1024 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 1024 + - - 1 + - 1745.42 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1024 + - - 16 + - 3956.68 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 4 + - - 24 + - 87.2296 + - - - 4288 + - 6784 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 6784 + - - 3 + - 2306.66 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 4 + - - 26 + - 196.122 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 256 + - 4 + - - 29 + - 0.0978968 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 6784 + - - 24 + - 344.27 + - - - 1024 + - 4288 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 4288 + - - 4 + - 1486.24 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 6784 + - - 14 + - 4174.99 + - - - 2368 + - 1856 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 1856 + - - 3 + - 1769.51 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 5056 + - - 14 + - 3691.24 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 2944 + - - 14 + - 4290.09 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 256 + - 5888 + - - 6 + - 2063.07 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 5888 + - - 14 + - 4034.17 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 2944 + - - 14 + - 3846.24 + - - - 1024 + - 256 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 256 + - - 2 + - 360.645 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 128 + - - 6 + - 3176.72 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1408 + - - 10 + - 3344.44 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 704 + - - 6 + - 3326.71 + - - - 3584 + - 6784 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 6784 + - - 4 + - 2006.92 + - - - 4288 + - 3584 + - 1 + - 256 + - 
4288 + - 4288 + - 256 + - 3584 + - - 14 + - 4224.57 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 768 + - 256 + - - 6 + - 975.204 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 448 + - - 6 + - 2168.4 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 768 + - 2944 + - - 6 + - 2488.02 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 6784 + - - 14 + - 4303.23 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 6784 + - - 14 + - 4448.94 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 64 + - - 6 + - 2028.13 + - - - 1856 + - 2368 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 2368 + - - 3 + - 1761.97 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 128 + - - 6 + - 2722.04 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 704 + - - 12 + - 2559.39 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 6784 + - - 14 + - 3769.68 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 64 + - - 6 + - 1568.89 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 6784 + - - 14 + - 4388.3 + - - - 64 + - 2368 + - 1 + - 128 + - 64 + - 64 + - 128 + - 2368 + - - 2 + - 218.453 + - - - 1024 + - 3584 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 3584 + - - 4 + - 1310.14 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 256 + - 3584 + - - 25 + - 58.8144 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1024 + - - 17 + - 408.802 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 768 + - 5056 + - - 6 + - 3097.89 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 4 + - - 26 + - 102.98 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 768 + - 1856 + - - 6 + - 2924.99 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1856 + - - 6 + - 2287.84 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 128 + - - 8 + - 270.252 + - - - 3584 + - 4 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 4 + - - 24 + - 
62.5727 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1856 + - - 14 + - 3832.55 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1024 + - - 14 + - 3492.65 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 448 + - - 9 + - 758.268 + - - - 5888 + - 2368 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 2368 + - - 4 + - 1891.19 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 704 + - - 9 + - 921.046 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1856 + - - 18 + - 4133.48 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 2368 + - - 14 + - 4220.49 + - - - 64 + - 6784 + - 1 + - 128 + - 64 + - 64 + - 128 + - 6784 + - - 2 + - 539.349 + - - - 5888 + - 1408 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 1408 + - - 4 + - 1773.33 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 2368 + - - 6 + - 2234.13 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2944 + - - 6 + - 2064.83 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 5056 + - - 14 + - 4185.97 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 4 + - - 28 + - 49.2591 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 5888 + - - 14 + - 3995.35 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1408 + - - 6 + - 1037.26 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 768 + - 5888 + - - 6 + - 2447.62 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 2368 + - - 18 + - 3975.89 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 448 + - - 11 + - 1152.02 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 5056 + - - 14 + - 3847.8 + - - - 6784 + - 5056 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 5056 + - - 3 + - 2253.43 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 64 + - - 6 + - 2498.33 + - - - 1856 + - 1408 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 1408 + - - 3 + - 1593.44 + - - - 3584 
+ - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 6784 + - - 14 + - 4369.31 + - - - 704 + - 2944 + - 1 + - 256 + - 704 + - 704 + - 256 + - 2944 + - - 14 + - 2839.15 + - - - 6784 + - 6784 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 6784 + - - 3 + - 2315.32 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 1856 + - - 14 + - 4209.42 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 448 + - - 18 + - 3289.57 + - - - 1024 + - 5888 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 5888 + - - 4 + - 1494.02 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 448 + - - 12 + - 2471.93 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 2368 + - - 14 + - 3705.4 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1856 + - - 6 + - 1319.82 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 256 + - 4 + - - 26 + - 13.8209 + - - - 128 + - 4 + - 1 + - 128 + - 128 + - 128 + - 128 + - 4 + - - 22 + - 1.23004 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 768 + - 4 + - - 26 + - 4.26667 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 6784 + - - 14 + - 4338.11 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 4 + - - 25 + - 41.5211 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 256 + - - 10 + - 2813.25 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 64 + - - 17 + - 564.256 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 256 + - 64 + - - 17 + - 24.4537 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 448 + - - 5 + - 1556.61 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 6784 + - - 14 + - 4257.19 + - - - 448 + - 1024 + - 1 + - 128 + - 448 + - 448 + - 128 + - 1024 + - - 2 + - 573.44 + - - - 64 + - 5056 + - 1 + - 128 + - 64 + - 64 + - 128 + - 5056 + - - 2 + - 414.519 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 6784 + - - 14 + - 4398.8 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 
1856 + - - 6 + - 2286.37 + - - - 4288 + - 3584 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 3584 + - - 1 + - 2207.28 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 4 + - - 26 + - 14.4991 + - - - 128 + - 1856 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1856 + - - 2 + - 333.137 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1856 + - - 6 + - 714.49 + - - - 2944 + - 5056 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 5056 + - - 3 + - 2157.62 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 4 + - - 26 + - 20.3431 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 1408 + - - 7 + - 2863.76 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 4 + - - 26 + - 46.0859 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 704 + - - 9 + - 615.399 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 704 + - - 14 + - 3697.87 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 768 + - 704 + - - 6 + - 2102.61 + - - - 4 + - 3584 + - 1 + - 128 + - 4 + - 4 + - 128 + - 3584 + - - 22 + - 31.3787 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 64 + - - 6 + - 1791.77 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 4288 + - - 14 + - 3981.13 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 256 + - - 5 + - 1674.63 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 128 + - - 6 + - 1022.55 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 256 + - 4288 + - - 6 + - 1715.2 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 704 + - - 14 + - 2940.81 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 768 + - 128 + - - 17 + - 287.019 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 5056 + - - 14 + - 4299.56 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1024 + - - 14 + - 3900.87 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 4 + - - 27 + - 65.4216 + - - - 2944 + - 2944 + - 1 + - 
3328 + - 2944 + - 2944 + - 3328 + - 2944 + - - 18 + - 4067.43 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1408 + - - 6 + - 767.591 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 768 + - 5056 + - - 6 + - 2145.31 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 2944 + - - 10 + - 3417.46 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 5056 + - - 14 + - 4160.01 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 256 + - - 6 + - 2633.85 + - - - 4 + - 704 + - 1 + - 128 + - 4 + - 4 + - 128 + - 704 + - - 22 + - 6.16366 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1024 + - - 29 + - 47.6048 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 3584 + - - 6 + - 3262.24 + - - - 1856 + - 128 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 2 + - 331.973 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 4288 + - - 14 + - 4142.12 + - - - 5888 + - 256 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 256 + - - 0 + - 1058.24 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 768 + - 6784 + - - 14 + - 4192.48 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1024 + - - 16 + - 3262.03 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 64 + - - 11 + - 1539.49 + - - - 1856 + - 256 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 256 + - - 2 + - 604.307 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 1782.74 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 1024 + - - 14 + - 3782.89 + - - - 448 + - 448 + - 1 + - 128 + - 448 + - 448 + - 128 + - 448 + - - 2 + - 283.681 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 5056 + - - 16 + - 4242.85 + - - - 4 + - 256 + - 1 + - 128 + - 4 + - 4 + - 128 + - 256 + - - 22 + - 2.263 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 4 + - - 25 + - 135.325 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1408 + - - 6 + - 
2150.47 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 6784 + - - 14 + - 4463.66 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 2368 + - - 16 + - 3772.83 + - - - 4 + - 64 + - 1 + - 128 + - 4 + - 4 + - 128 + - 64 + - - 23 + - 0.56497 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 256 + - - 6 + - 1745.2 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 1408 + - - 26 + - 179.672 + - - - 4288 + - 256 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 256 + - - 3 + - 855.928 + - - - 2944 + - 1856 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 1856 + - - 1 + - 1723.68 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1856 + - - 14 + - 4146.18 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 768 + - 2368 + - - 6 + - 2026.32 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 6784 + - - 24 + - 295.215 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1856 + - - 14 + - 3984.73 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 5056 + - - 14 + - 4365.93 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 4288 + - - 14 + - 4161.65 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 64 + - - 9 + - 988.049 + - - - 5056 + - 4288 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 4288 + - - 3 + - 2187.57 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 128 + - - 6 + - 1705.21 + - - - 2944 + - 6784 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 6784 + - - 3 + - 2142.93 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 2368 + - - 16 + - 3716.22 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 256 + - 5056 + - - 6 + - 1593.03 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 3584 + - - 14 + - 4394.05 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 128 + - - 12 + - 1222.83 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 768 + - 5888 + - - 25 + - 190.963 + - - - 1408 + - 1024 + 
- 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1024 + - - 14 + - 3210.16 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 128 + - - 6 + - 2489.74 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 448 + - - 6 + - 3238.45 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 2368 + - - 14 + - 4051.23 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 768 + - 4288 + - - 12 + - 1987.59 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 2944 + - - 14 + - 4136.75 + - - - 6784 + - 4 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 4 + - - 22 + - 62.8336 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1856 + - - 16 + - 3650.86 + - - - 2368 + - 448 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 448 + - - 3 + - 851.245 + - - - 1024 + - 64 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 64 + - - 2 + - 94.2117 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 128 + - - 5 + - 1056.81 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 2368 + - - 16 + - 3908.77 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1024 + - - 16 + - 3429.59 + - - - 256 + - 128 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 2 + - 47.5329 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 64 + - - 12 + - 2102.3 + - - - 5056 + - 3584 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 3584 + - - 3 + - 2200.45 + - - - 128 + - 256 + - 1 + - 128 + - 128 + - 128 + - 128 + - 256 + - - 2 + - 48.3215 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 6784 + - - 14 + - 4236.26 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 3584 + - - 14 + - 4061.33 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 256 + - - 10 + - 2826.33 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 6784 + - - 14 + - 3947.7 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 64 + - - 21 + - 2101.37 + - - - 5056 + - 1408 + - 1 + - 
3328 + - 5056 + - 5056 + - 3328 + - 1408 + - - 16 + - 4056.44 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 5888 + - - 14 + - 4451.22 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 5888 + - - 14 + - 3722.55 + - - - 4288 + - 4288 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 4288 + - - 1 + - 2208.98 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 64 + - - 6 + - 3174.13 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 2368 + - - 14 + - 3544.36 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 128 + - - 6 + - 3345.07 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 2944 + - - 14 + - 4306.35 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 448 + - - 6 + - 2746.57 + - - - 1408 + - 704 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 704 + - - 2 + - 790.22 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 5056 + - - 16 + - 3949.63 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 704 + - - 14 + - 3156.71 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 448 + - - 18 + - 3995.45 + - - - 2944 + - 2944 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 2944 + - - 3 + - 1963.95 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 64 + - - 26 + - 7.87692 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 3584 + - - 14 + - 4358.45 + - - - 1408 + - 4 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 4 + - - 26 + - 180.642 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 4288 + - - 14 + - 4289.98 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 768 + - 5888 + - - 6 + - 2647.34 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 5888 + - - 14 + - 3898.41 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 2944 + - - 14 + - 3617.92 + - - - 2944 + - 4288 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 4288 + - - 3 + - 2052.87 + - - - 1856 + - 1024 + - 1 + - 
1792 + - 1856 + - 1856 + - 1792 + - 1024 + - - 14 + - 4163.13 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1408 + - - 6 + - 2610.65 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 5056 + - - 16 + - 4025.78 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 1408 + - - 14 + - 3617.59 + - - - 1856 + - 1024 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 1024 + - - 3 + - 1466.89 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 704 + - - 26 + - 98.277 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 2368 + - - 14 + - 3583.69 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 768 + - 4288 + - - 6 + - 3210.73 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 2368 + - - 18 + - 3920.2 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 704 + - - 6 + - 3214.41 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1024 + - - 14 + - 3867.15 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1408 + - - 11 + - 1350.38 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 128 + - - 21 + - 1407.48 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 256 + - 128 + - - 25 + - 3.35051 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 448 + - - 6 + - 3403.06 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1856 + - - 18 + - 3880.26 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 4288 + - - 14 + - 4149.39 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 3584 + - - 14 + - 4199.39 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1408 + - - 14 + - 3521.01 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1024 + - - 12 + - 2821.12 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 448 + - - 14 + - 3517.53 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 6784 + - - 14 + - 3964.46 + - - - 64 + - 4 + - 1 + - 3328 + - 
64 + - 64 + - 3328 + - 4 + - - 26 + - 10.7899 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 2944 + - - 6 + - 3267.55 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1856 + - - 14 + - 4054.97 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 6784 + - - 14 + - 4310.4 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 6784 + - - 6 + - 3294.01 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 256 + - - 12 + - 2214.46 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 448 + - - 6 + - 3440.14 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 5888 + - - 14 + - 4101.95 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 256 + - - 29 + - 27.9386 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 64 + - - 19 + - 152.283 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 2368 + - - 14 + - 4141.82 + - - - 1024 + - 6784 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 6784 + - - 4 + - 1629.04 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 256 + - 704 + - - 6 + - 1564.07 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 1856 + - - 26 + - 225.925 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 5056 + - - 14 + - 4363.54 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 256 + - 3584 + - - 6 + - 1241.97 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 3584 + - - 16 + - 3794.12 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 4288 + - - 14 + - 3830.08 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3584 + - - 6 + - 3422.54 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 256 + - 4 + - - 25 + - 1.75418 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 6784 + - - 14 + - 4470.8 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 1856 + - - 14 + - 3826.95 + - - - 256 + - 5056 + - 1 + - 128 + - 256 + - 256 + - 128 + - 5056 + - - 4 
+ - 759.42 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 768 + - 704 + - - 26 + - 35.6174 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1856 + - - 14 + - 4135.08 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 256 + - - 8 + - 260.84 + - - - 704 + - 6784 + - 1 + - 128 + - 704 + - 704 + - 128 + - 6784 + - - 4 + - 1843.99 + - - - 1856 + - 2944 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 2944 + - - 3 + - 1884.97 + - - - 3584 + - 1408 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 1408 + - - 4 + - 1501.31 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 5056 + - - 14 + - 4250.78 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 2944 + - - 14 + - 4350.29 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 64 + - - 6 + - 2852.9 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 128 + - - 6 + - 1319.82 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 4288 + - - 25 + - 255.626 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 256 + - 3584 + - - 14 + - 3401.03 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 704 + - - 6 + - 2730.4 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 64 + - - 9 + - 448.814 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 2944 + - - 16 + - 2748.4 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 64 + - - 5 + - 1522.32 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 128 + - - 11 + - 1468.91 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 5888 + - - 14 + - 4414.82 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 256 + - 6784 + - - 6 + - 2340.97 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 5888 + - - 6 + - 2864.81 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 64 + - - 6 + - 1043.13 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 2368 + - - 14 + - 4036.35 + - - - 5888 + - 1408 + - 1 + 
- 1792 + - 5888 + - 5888 + - 1792 + - 1408 + - - 14 + - 4198.29 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 6784 + - - 6 + - 3322.62 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 448 + - - 6 + - 3512.62 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 768 + - 4 + - - 26 + - 36.0448 + - - - 5888 + - 5888 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 5888 + - - 1 + - 1910.58 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 704 + - - 12 + - 1673.72 + - - - 4288 + - 128 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 2 + - 649.543 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 256 + - 128 + - - 17 + - 369.217 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 3584 + - - 14 + - 4286.86 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1856 + - - 16 + - 3894.58 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 5888 + - - 14 + - 4374.04 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 256 + - 704 + - - 6 + - 550.302 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1408 + - - 14 + - 3715.62 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 3584 + - - 14 + - 4359.77 + - - - 1408 + - 1856 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 1856 + - - 3 + - 1461.45 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 1408 + - - 14 + - 3992.11 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1024 + - - 6 + - 1900.33 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 128 + - - 6 + - 2171.03 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 5888 + - - 14 + - 4297.72 + - - - 256 + - 3584 + - 1 + - 128 + - 256 + - 256 + - 128 + - 3584 + - - 2 + - 749.365 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 2368 + - - 10 + - 3093.07 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 2368 + - - 6 + - 3475.42 + - - - 448 + - 1856 + - 1 + - 3328 + - 
448 + - 448 + - 3328 + - 1856 + - - 6 + - 3232.7 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 2368 + - - 14 + - 3634.65 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 2944 + - - 16 + - 3411.77 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 256 + - 2368 + - - 6 + - 1494.5 + - - - 6784 + - 64 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 64 + - - 2 + - 554.415 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 128 + - - 6 + - 2934.25 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 128 + - - 6 + - 2977.7 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 768 + - 6784 + - - 6 + - 2997.55 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 5888 + - - 6 + - 2761.22 + - - - 5888 + - 64 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 64 + - - 2 + - 477.758 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 256 + - 6784 + - - 24 + - 100.971 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 768 + - 448 + - - 6 + - 1645.4 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 768 + - 128 + - - 8 + - 78.2519 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 5888 + - - 14 + - 4216.99 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 3584 + - - 14 + - 3980.94 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 4288 + - - 25 + - 327.455 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1856 + - - 5 + - 1214.41 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 6784 + - - 14 + - 4096.48 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 5056 + - - 14 + - 4202.94 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 768 + - 3584 + - - 14 + - 3732.22 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1856 + - - 12 + - 2106.7 + - - - 1024 + - 4 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 4 + - - 22 + - 9.79621 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1024 + - - 14 + - 3984.54 
+ - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 2368 + - - 14 + - 4110.62 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1408 + - - 6 + - 2690.22 + - - - 4 + - 448 + - 1 + - 128 + - 4 + - 4 + - 128 + - 448 + - - 23 + - 4.027 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 2944 + - - 6 + - 3444.89 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 3584 + - - 18 + - 4051.1 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 256 + - - 6 + - 2014.26 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 5056 + - - 14 + - 4173.16 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 4 + - - 29 + - 65.3308 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 2368 + - - 14 + - 4220.1 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 6784 + - - 10 + - 3468.55 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 448 + - - 6 + - 3355.71 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 448 + - - 9 + - 663.379 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 4288 + - - 14 + - 4311.37 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 4 + - - 25 + - 24.9964 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 2368 + - - 16 + - 3961.51 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 5056 + - - 25 + - 343.396 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 6 + - 2064.83 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 768 + - 4 + - - 26 + - 0.268531 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 256 + - 5056 + - - 6 + - 1997.05 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 704 + - - 10 + - 2489.62 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 5056 + - - 14 + - 4027.44 + - - - 1856 + - 3584 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 3584 + - - 3 + - 1996.07 + - - - 256 + - 3584 + - 1 + - 
256 + - 256 + - 256 + - 256 + - 3584 + - - 6 + - 2507.27 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 256 + - 3584 + - - 14 + - 2990.7 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 2944 + - - 14 + - 4336.07 + - - - 448 + - 1856 + - 1 + - 128 + - 448 + - 448 + - 128 + - 1856 + - - 2 + - 905.021 + - - - 64 + - 2944 + - 1 + - 128 + - 64 + - 64 + - 128 + - 2944 + - - 3 + - 210.227 + - - - 256 + - 6784 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 6784 + - - 14 + - 3757.94 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 4288 + - - 14 + - 4224.84 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 704 + - - 16 + - 4020.86 + - - - 1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 4 + - - 26 + - 154.122 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 17 + - 211.406 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 128 + - - 26 + - 14.5359 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 448 + - - 6 + - 2922.84 + - - - 5888 + - 5056 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 5056 + - - 1 + - 1902.68 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 704 + - - 14 + - 3545.39 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 2944 + - - 6 + - 3225.35 + - - - 4 + - 4288 + - 1 + - 128 + - 4 + - 4 + - 128 + - 4288 + - - 22 + - 37.7489 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1856 + - - 6 + - 3852.02 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 768 + - 2368 + - - 6 + - 1210.4 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 704 + - - 18 + - 3344.2 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1024 + - - 14 + - 1959.96 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 768 + - 2944 + - - 6 + - 3160.65 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 128 + - - 19 + - 230.729 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1408 + - - 6 + 
- 3388.3 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 5056 + - - 25 + - 271.757 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 2368 + - - 26 + - 181.036 + - - - 2368 + - 5888 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 5888 + - - 3 + - 2147.11 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 6784 + - - 14 + - 4334.69 + - - - 128 + - 1408 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1408 + - - 2 + - 259.782 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 768 + - 64 + - - 8 + - 41.6984 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 256 + - 5888 + - - 14 + - 3543.68 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 256 + - - 6 + - 3388.51 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 128 + - - 9 + - 1160.83 + - - - 3584 + - 704 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 704 + - - 4 + - 1246.76 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 4288 + - - 14 + - 4078.8 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 448 + - - 6 + - 1990.64 + - - - 64 + - 704 + - 1 + - 128 + - 64 + - 64 + - 128 + - 704 + - - 2 + - 63.9659 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 4 + - - 27 + - 77.5981 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 768 + - 5888 + - - 14 + - 3880.34 + - - - 704 + - 128 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 2 + - 131.191 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 2368 + - - 16 + - 3087.17 + - - - 2368 + - 1024 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 1024 + - - 3 + - 1463.5 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 256 + - 64 + - - 17 + - 184.608 + - - - 256 + - 64 + - 1 + - 128 + - 256 + - 256 + - 128 + - 64 + - - 2 + - 23.5741 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 256 + - - 6 + - 2987.8 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 1408 + - - 16 + - 3596.38 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 
768 + - 1024 + - - 6 + - 1070.89 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 768 + - 448 + - - 6 + - 974.34 + - - - 3584 + - 1856 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 1856 + - - 4 + - 1677.39 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 256 + - - 14 + - 2849.45 + - - - 1024 + - 128 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 2 + - 191.521 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 704 + - - 14 + - 3627.59 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1408 + - - 14 + - 4103.69 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 4288 + - - 14 + - 4185.89 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 768 + - 1408 + - - 6 + - 2401.32 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 2944 + - - 21 + - 1943.98 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 5888 + - - 25 + - 287.816 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 5888 + - - 14 + - 3349.44 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 256 + - - 10 + - 3246.57 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1024 + - - 16 + - 3786.81 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 768 + - 3584 + - - 14 + - 3378.8 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 4 + - - 26 + - 92.2115 + - - - 6784 + - 1024 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 1024 + - - 3 + - 1820.63 + - - - 1408 + - 448 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 448 + - - 2 + - 725.56 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 5888 + - - 14 + - 4469.75 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1408 + - - 14 + - 3898.2 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 4 + - - 27 + - 98.3411 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 4288 + - - 14 + - 3112.74 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1024 + - - 6 + 
- 2181.29 + - - - 4288 + - 704 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 704 + - - 1 + - 1473.01 + - - - 2944 + - 1024 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 1024 + - - 1 + - 1425.79 + - - - 256 + - 1024 + - 1 + - 128 + - 256 + - 256 + - 128 + - 1024 + - - 2 + - 317.991 + - - - 5056 + - 704 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 704 + - - 1 + - 1705.62 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 4288 + - - 14 + - 4246.58 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 6 + - 2185.89 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1856 + - - 14 + - 3794.9 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 256 + - 64 + - - 17 + - 53.2813 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1856 + - - 6 + - 3632.06 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1024 + - - 14 + - 3677.22 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 2368 + - - 18 + - 4015.85 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 1408 + - - 18 + - 4115.4 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 6784 + - - 14 + - 4453.3 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 256 + - - 6 + - 2669.1 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 2944 + - - 6 + - 2941.68 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 768 + - 1408 + - - 12 + - 2300.73 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 1408 + - - 16 + - 3786.73 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 4 + - - 24 + - 141.819 + - - - 5056 + - 5888 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 5888 + - - 3 + - 2289.54 + - - - 256 + - 448 + - 1 + - 128 + - 256 + - 256 + - 128 + - 448 + - - 2 + - 167.428 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 448 + - - 6 + - 2718.53 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 768 + - 448 + - - 6 + - 2098.24 + - - - 
256 + - 4288 + - 1 + - 128 + - 256 + - 256 + - 128 + - 4288 + - - 4 + - 726.371 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 128 + - - 12 + - 2365.88 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 448 + - - 6 + - 2239.29 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 768 + - 5056 + - - 12 + - 2305.31 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1024 + - - 16 + - 3332.59 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 768 + - 5056 + - - 6 + - 3322.36 + - - - 2368 + - 128 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 2 + - 404.813 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 128 + - - 6 + - 2845.93 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 5888 + - - 14 + - 3288.61 + - - - 704 + - 704 + - 1 + - 128 + - 704 + - 704 + - 128 + - 704 + - - 2 + - 591.78 + - - - 6784 + - 1408 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 1408 + - - 3 + - 2008.81 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 4 + - - 29 + - 48.7256 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1408 + - - 6 + - 3624.3 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 64 + - - 26 + - 10.6924 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 704 + - - 6 + - 2796.76 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1856 + - - 14 + - 4161.04 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1856 + - - 21 + - 2465.16 + - - - 64 + - 128 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 2 + - 11.5686 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 6784 + - - 14 + - 3378.9 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1856 + - - 5 + - 1698.66 + - - - 5888 + - 3584 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 3584 + - - 3 + - 1850.8 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 3584 + - - 16 + - 3197.4 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 
448 + - 3328 + - 3584 + - - 14 + - 3583.58 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 4288 + - - 14 + - 4194.22 + - - - 2368 + - 1408 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 1408 + - - 1 + - 1675.45 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 5888 + - - 14 + - 4289.0 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3584 + - - 14 + - 4065.82 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 4 + - - 29 + - 194.699 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 5888 + - - 14 + - 4298.63 + - - - 1856 + - 64 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 64 + - - 2 + - 170.147 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1408 + - - 14 + - 3751.5 + - - - 2944 + - 256 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 256 + - - 2 + - 831.629 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 128 + - - 6 + - 1101.83 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1024 + - - 5 + - 748.601 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 1302.58 + - - - 448 + - 256 + - 1 + - 128 + - 448 + - 448 + - 128 + - 256 + - - 2 + - 168.814 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1024 + - - 7 + - 3177.17 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 3584 + - - 14 + - 4218.1 + - - - 128 + - 704 + - 1 + - 128 + - 128 + - 128 + - 128 + - 704 + - - 2 + - 130.597 + - - - 1024 + - 2944 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 2944 + - - 4 + - 1234.25 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 3584 + - - 25 + - 228.887 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 2944 + - - 14 + - 4131.78 + - - - 2368 + - 5056 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 5056 + - - 3 + - 2100.23 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 2944 + - - 14 + - 4079.25 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 64 
+ - - 20 + - 2120.43 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 6784 + - - 14 + - 4327.63 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 768 + - 4288 + - - 6 + - 1820.7 + - - - 1856 + - 704 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 704 + - - 3 + - 1047.92 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 2368 + - - 6 + - 3706.33 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 128 + - - 10 + - 2817.47 + - - - 704 + - 2944 + - 1 + - 128 + - 704 + - 704 + - 128 + - 2944 + - - 3 + - 1227.74 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1024 + - - 14 + - 2614.01 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 5888 + - - 14 + - 4324.17 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 2368 + - - 6 + - 2806.32 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1856 + - - 14 + - 3709.73 + - - - 4 + - 6784 + - 1 + - 128 + - 4 + - 4 + - 128 + - 6784 + - - 22 + - 60.1357 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 448 + - - 6 + - 2739.19 + - - - 2944 + - 4 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 4 + - - 22 + - 27.0715 + - - - 256 + - 4 + - 1 + - 128 + - 256 + - 256 + - 128 + - 4 + - - 22 + - 2.47869 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 1408 + - - 6 + - 3748.66 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 5056 + - - 14 + - 4378.79 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 2368 + - - 6 + - 2732.68 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 128 + - - 9 + - 406.667 + - - - 64 + - 1408 + - 1 + - 128 + - 64 + - 64 + - 128 + - 1408 + - - 2 + - 134.37 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 4 + - - 25 + - 32.1908 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 128 + - - 9 + - 689.853 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 448 + - - 21 + - 2173.73 + - - - 1408 + - 64 
+ - 1 + - 128 + - 1408 + - 1408 + - 128 + - 64 + - - 2 + - 129.541 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 768 + - 2944 + - - 12 + - 1461.06 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 5888 + - - 14 + - 4378.32 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 128 + - - 7 + - 2928.23 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 448 + - - 6 + - 3147.23 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 6784 + - - 14 + - 4541.16 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 14 + - 2735.93 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 6784 + - - 18 + - 4118.04 + - - - 704 + - 1408 + - 1 + - 128 + - 704 + - 704 + - 128 + - 1408 + - - 4 + - 804.653 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 64 + - - 6 + - 998.534 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 4 + - - 25 + - 65.7507 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 64 + - - 6 + - 2774.83 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 4288 + - - 18 + - 4146.53 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 4 + - - 25 + - 150.511 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 4288 + - - 10 + - 2639.32 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 256 + - - 6 + - 3242.17 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 5056 + - - 6 + - 3496.28 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 128 + - - 12 + - 1668.88 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 4288 + - - 6 + - 2032.16 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 64 + - - 19 + - 414.331 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1408 + - - 14 + - 4348.82 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3584 + - - 14 + - 4280.57 + - - - 1856 + - 1856 + - 1 + - 
1792 + - 1856 + - 1856 + - 1792 + - 1856 + - - 16 + - 3823.12 + - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 5888 + - - 14 + - 3317.37 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 2944 + - - 14 + - 3988.33 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 768 + - 4288 + - - 14 + - 3971.96 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 768 + - 3584 + - - 25 + - 139.58 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 256 + - - 14 + - 3765.58 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 64 + - - 19 + - 239.991 + - - - 64 + - 4 + - 1 + - 128 + - 64 + - 64 + - 128 + - 4 + - - 22 + - 0.605923 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 1856 + - - 18 + - 4034.94 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 5056 + - - 6 + - 3304.44 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 768 + - 64 + - - 8 + - 150.226 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 768 + - 448 + - - 17 + - 496.843 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 25 + - 5.71867 + - - - 64 + - 64 + - 1 + - 128 + - 64 + - 64 + - 128 + - 64 + - - 2 + - 5.72867 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1856 + - - 6 + - 3416.44 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 6784 + - - 6 + - 3166.9 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 64 + - - 6 + - 1361.52 + - - - 5888 + - 448 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 448 + - - 3 + - 1173.34 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 768 + - 2368 + - - 12 + - 2206.06 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 4 + - - 26 + - 28.5294 + - - - 64 + - 704 + - 1 + - 768 + - 64 + - 64 + - 768 + - 704 + - - 17 + - 394.291 + - - - 6784 + - 128 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 2 + - 942.58 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 5056 + - - 14 + - 4217.11 + - - - 1856 + 
- 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1408 + - - 14 + - 3985.6 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 1856 + - - 18 + - 2939.46 + - - - 2944 + - 1408 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 1408 + - - 3 + - 1564.95 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 256 + - - 5 + - 2076.24 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 768 + - 5056 + - - 16 + - 3760.79 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 14 + - 3004.03 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3584 + - - 16 + - 4385.76 + - - - 3584 + - 2944 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 2944 + - - 4 + - 1806.54 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 256 + - - 5 + - 1222.76 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 448 + - - 9 + - 1157.45 + - - - 704 + - 4288 + - 1 + - 128 + - 704 + - 704 + - 128 + - 4288 + - - 1 + - 1427.31 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 5888 + - - 6 + - 2815.56 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 2944 + - - 14 + - 3733.63 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 64 + - - 12 + - 1488.72 + - - - 128 + - 4288 + - 1 + - 128 + - 128 + - 128 + - 128 + - 4288 + - - 2 + - 607.739 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 704 + - - 12 + - 2888.03 + - - - 64 + - 4288 + - 1 + - 128 + - 64 + - 64 + - 128 + - 4288 + - - 2 + - 357.566 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 256 + - 2368 + - - 14 + - 2976.91 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 5888 + - - 14 + - 4387.75 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 704 + - - 14 + - 3790.63 + - - - 64 + - 1856 + - 1 + - 128 + - 64 + - 64 + - 128 + - 1856 + - - 2 + - 180.317 + - - - 1024 + - 1856 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1856 + - - 14 + - 4007.93 + - - - 4288 + - 2944 + - 1 + - 
128 + - 4288 + - 4288 + - 128 + - 2944 + - - 3 + - 2146.46 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 2944 + - - 14 + - 3703.84 + - - - 1856 + - 4 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 4 + - - 22 + - 17.0668 + - - - 64 + - 1024 + - 1 + - 128 + - 64 + - 64 + - 128 + - 1024 + - - 2 + - 95.4118 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 256 + - 5056 + - - 27 + - 76.5879 + - - - 5056 + - 2944 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 2944 + - - 1 + - 2165.47 + - - - 2944 + - 6784 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 6784 + - - 14 + - 4285.9 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 768 + - 1408 + - - 6 + - 1467.47 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 768 + - 5888 + - - 14 + - 3654.13 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 1408 + - - 6 + - 3679.57 + - - - 256 + - 1408 + - 1 + - 128 + - 256 + - 256 + - 128 + - 1408 + - - 2 + - 383.201 + - - - 6784 + - 4288 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 4288 + - - 3 + - 2247.95 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1856 + - - 14 + - 4013.58 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 704 + - - 6 + - 3279.17 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 448 + - - 6 + - 3561.0 + - - - 256 + - 256 + - 1 + - 128 + - 256 + - 256 + - 128 + - 256 + - - 2 + - 92.6304 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 4 + - - 25 + - 58.9656 + - - - 5056 + - 1856 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 1856 + - - 1 + - 2074.09 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3584 + - - 18 + - 3979.75 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1408 + - - 14 + - 3804.96 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 6784 + - - 14 + - 4304.48 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 768 + - 2368 + - - 14 + - 3447.63 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 
+ - 3328 + - 5056 + - - 16 + - 4047.07 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 3584 + - - 14 + - 4235.04 + - - - 448 + - 1408 + - 1 + - 128 + - 448 + - 448 + - 128 + - 1408 + - - 2 + - 729.23 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 2944 + - - 16 + - 3360.79 + - - - 4 + - 1408 + - 1 + - 128 + - 4 + - 4 + - 128 + - 1408 + - - 22 + - 12.782 + - - - 128 + - 2944 + - 1 + - 128 + - 128 + - 128 + - 128 + - 2944 + - - 2 + - 455.042 + - - - 1408 + - 6784 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 6784 + - - 3 + - 1970.73 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 704 + - - 14 + - 3696.9 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 2368 + - - 18 + - 3972.14 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 1856 + - - 14 + - 3600.7 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 1408 + - - 14 + - 3637.74 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3584 + - - 25 + - 299.087 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 3584 + - - 14 + - 4360.31 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1856 + - - 14 + - 3908.18 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 5056 + - - 18 + - 4036.73 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 128 + - - 6 + - 2030.33 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1856 + - - 18 + - 3665.17 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 256 + - 4288 + - - 25 + - 67.5109 + - - - 2944 + - 2368 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 2368 + - - 3 + - 1832.77 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 64 + - - 9 + - 674.254 + - - - 2368 + - 2944 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 2944 + - - 1 + - 1930.13 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3584 + - - 14 + - 4319.35 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 768 + - 64 + - - 
26 + - 4.2965 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 64 + - - 19 + - 131.375 + - - - 3584 + - 5888 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 5888 + - - 4 + - 1885.32 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 704 + - - 14 + - 3708.99 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 6 + - 2307.19 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 256 + - 1856 + - - 25 + - 32.3222 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 6784 + - - 14 + - 4449.05 + - - - 3584 + - 448 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 448 + - - 4 + - 1026.78 + - - - 448 + - 128 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 2 + - 84.8755 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 3584 + - - 14 + - 3747.81 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 5056 + - - 14 + - 4028.67 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 2368 + - - 5 + - 1765.49 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 4 + - - 26 + - 178.447 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 768 + - 4288 + - - 6 + - 2643.8 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 64 + - - 6 + - 2140.87 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 768 + - 4 + - - 26 + - 24.8601 + - - - 128 + - 448 + - 1 + - 128 + - 128 + - 128 + - 128 + - 448 + - - 2 + - 84.3294 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1856 + - - 14 + - 3723.24 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 2368 + - - 14 + - 4153.7 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 256 + - 2368 + - - 6 + - 2260.16 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 2944 + - - 14 + - 4282.68 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 448 + - - 6 + - 3531.03 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 2944 + - - 26 + - 277.24 + - - - 2944 + - 1408 + - 1 + - 
1792 + - 2944 + - 2944 + - 1792 + - 1408 + - - 14 + - 3662.35 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 256 + - 2944 + - - 6 + - 1863.77 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 64 + - - 5 + - 1778.13 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 17 + - 409.6 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 5056 + - - 14 + - 4267.29 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1024 + - - 14 + - 3157.62 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 5888 + - - 14 + - 4190.54 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3584 + - - 18 + - 4076.96 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 448 + - - 26 + - 67.0388 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1024 + - - 14 + - 3445.75 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 64 + - - 9 + - 655.36 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 256 + - 3584 + - - 6 + - 2178.05 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 768 + - 4 + - - 26 + - 15.147 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1408 + - - 6 + - 3070.61 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 4 + - - 26 + - 7.70753 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 4 + - - 26 + - 119.125 + - - - 5056 + - 6784 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 6784 + - - 1 + - 2331.35 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 5888 + - - 14 + - 3929.28 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 448 + - - 16 + - 3378.1 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 3584 + - - 14 + - 4278.18 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 256 + - - 6 + - 3105.04 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 5056 + - - 14 + - 4150.22 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 768 
+ - 6784 + - - 14 + - 4317.69 + - - - 6784 + - 2944 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 2944 + - - 3 + - 2195.79 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 704 + - - 18 + - 3912.39 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 5888 + - - 14 + - 4288.37 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 6 + - 1892.55 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 256 + - 1024 + - - 6 + - 776.723 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 2368 + - - 12 + - 1403.96 + - - - 3584 + - 2368 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 2368 + - - 4 + - 1789.31 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 2368 + - - 26 + - 258.894 + - - - 448 + - 2368 + - 1 + - 128 + - 448 + - 448 + - 128 + - 2368 + - - 4 + - 826.781 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 768 + - 704 + - - 6 + - 767.591 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1024 + - - 16 + - 3385.73 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 2944 + - - 16 + - 3926.46 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 128 + - - 6 + - 2391.33 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 2368 + - - 14 + - 3578.14 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 4 + - - 26 + - 167.805 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 2368 + - - 14 + - 4243.79 + - - - 128 + - 256 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 256 + - - 9 + - 746.522 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 5056 + - - 16 + - 4350.66 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1408 + - - 5 + - 998.767 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 2944 + - - 14 + - 4353.0 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 4288 + - - 14 + - 4033.43 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 1856 + 
- - 14 + - 3770.5 + - - - 2368 + - 3584 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 3584 + - - 3 + - 2050.91 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 128 + - - 6 + - 2650.25 + - - - 448 + - 704 + - 1 + - 128 + - 448 + - 448 + - 128 + - 704 + - - 2 + - 416.016 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 64 + - - 6 + - 2484.51 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 768 + - 3584 + - - 6 + - 2926.26 + - - - 1024 + - 1024 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 1024 + - - 4 + - 764.338 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3584 + - - 14 + - 4366.79 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 256 + - 2944 + - - 25 + - 49.1948 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 2944 + - - 26 + - 199.836 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 768 + - 1024 + - - 6 + - 2983.75 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 3584 + - - 14 + - 3935.22 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 5888 + - - 14 + - 4415.85 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 4288 + - - 14 + - 4290.87 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 768 + - 64 + - - 17 + - 250.913 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 2944 + - - 14 + - 4249.66 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 256 + - - 6 + - 2935.9 + - - - 128 + - 5888 + - 1 + - 128 + - 128 + - 128 + - 128 + - 5888 + - - 2 + - 779.484 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 2944 + - - 16 + - 4246.43 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 6784 + - - 14 + - 4377.96 + - - - 5888 + - 4288 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 4288 + - - 4 + - 2015.49 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 704 + - - 14 + - 3455.36 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 256 + - 4288 + - - 14 + - 2873.29 + - - - 
1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 3584 + - - 14 + - 3825.52 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 768 + - 2944 + - - 6 + - 2668.82 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 5888 + - - 14 + - 4321.94 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 256 + - 1408 + - - 6 + - 1969.28 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 2944 + - - 14 + - 4291.77 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 5888 + - - 14 + - 3829.55 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 2944 + - - 14 + - 4208.83 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 5056 + - - 12 + - 2458.71 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 2944 + - - 16 + - 3965.52 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 4288 + - - 14 + - 3760.67 + - - - 256 + - 1856 + - 1 + - 128 + - 256 + - 256 + - 128 + - 1856 + - - 2 + - 468.981 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 128 + - - 5 + - 2018.66 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 768 + - 128 + - - 17 + - 495.948 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 6784 + - - 14 + - 4207.7 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 64 + - - 6 + - 697.447 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 448 + - - 26 + - 46.2985 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1024 + - - 10 + - 2134.51 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 5056 + - - 14 + - 4393.36 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 2944 + - - 14 + - 4170.09 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 704 + - - 6 + - 1042.89 + - - - 2944 + - 64 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 64 + - - 2 + - 262.601 + - - - 704 + - 4 + - 1 + - 128 + - 704 + - 704 + - 128 + - 4 + - - 22 + - 6.84748 + - - - 128 + - 4 + - 1 + - 
768 + - 128 + - 128 + - 768 + - 4 + - - 29 + - 7.87692 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 4288 + - - 14 + - 3635.11 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 128 + - - 6 + - 2077.28 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 6784 + - - 14 + - 4472.49 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 5056 + - - 14 + - 4205.98 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 4288 + - - 14 + - 4139.4 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 128 + - - 6 + - 2243.73 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 3584 + - - 14 + - 3844.03 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 2368 + - - 14 + - 3926.62 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 256 + - - 9 + - 494.611 + - - - 3584 + - 4288 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 4288 + - - 4 + - 1896.14 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 4288 + - - 14 + - 3879.42 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 1408 + - - 10 + - 3021.56 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 256 + - 64 + - - 17 + - 294.845 + - - - 4 + - 5888 + - 1 + - 128 + - 4 + - 4 + - 128 + - 5888 + - - 23 + - 51.5506 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 128 + - - 12 + - 2175.6 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1856 + - - 14 + - 3969.94 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 1024 + - - 12 + - 2400.75 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 2368 + - - 6 + - 3846.67 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 768 + - 1024 + - - 12 + - 2607.61 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 4 + - - 24 + - 67.1804 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 5056 + - - 14 + - 3641.35 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 
448 + - 256 + - 4288 + - - 14 + - 3351.84 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 2368 + - - 14 + - 3949.8 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1024 + - - 16 + - 3881.05 + - - - 704 + - 5056 + - 1 + - 128 + - 704 + - 704 + - 128 + - 5056 + - - 1 + - 1679.47 + - - - 1856 + - 1856 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 1856 + - - 1 + - 1725.06 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 2944 + - - 6 + - 2786.74 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1408 + - - 14 + - 3258.78 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 448 + - - 18 + - 3217.97 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 1856 + - - 14 + - 4009.94 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 2368 + - - 16 + - 3550.11 + - - - 2944 + - 128 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 2 + - 483.118 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 768 + - 448 + - - 17 + - 250.684 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 2368 + - - 14 + - 4180.98 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 5056 + - - 14 + - 4215.39 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 448 + - - 18 + - 2750.55 + - - - 448 + - 6784 + - 1 + - 128 + - 448 + - 448 + - 128 + - 6784 + - - 1 + - 1479.4 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 64 + - - 6 + - 1238.21 + - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 448 + - - 18 + - 2830.48 + - - - 1856 + - 448 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 448 + - - 2 + - 900.732 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 128 + - - 6 + - 3042.4 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 4288 + - - 14 + - 4266.67 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 4288 + - - 14 + - 3787.5 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 448 
+ - - 9 + - 427.03 + - - - 5056 + - 5056 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 5056 + - - 1 + - 2249.91 + - - - 1024 + - 1408 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 1408 + - - 4 + - 954.039 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 5888 + - - 14 + - 4077.8 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 768 + - 128 + - - 8 + - 149.797 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 256 + - 5888 + - - 27 + - 88.3545 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 2944 + - - 14 + - 4345.57 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 6784 + - - 14 + - 3848.24 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 4288 + - - 14 + - 4255.32 + - - - 6784 + - 3584 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 3584 + - - 3 + - 2206.09 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 2368 + - - 14 + - 3841.52 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 5056 + - - 6 + - 2373.37 + - - - 3584 + - 64 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 64 + - - 2 + - 313.945 + - - - 1408 + - 1024 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 1024 + - - 3 + - 1082.02 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 5888 + - - 14 + - 4445.64 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 1024 + - - 11 + - 1028.79 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1408 + - - 12 + - 1653.16 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 14 + - 2456.63 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 256 + - - 14 + - 3541.28 + - - - 2368 + - 64 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 64 + - - 2 + - 211.038 + - - - 128 + - 3584 + - 1 + - 128 + - 128 + - 128 + - 128 + - 3584 + - - 2 + - 553.965 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 256 + - 704 + - - 28 + - 13.4697 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 704 + - - 10 + - 2987.41 + - - - 4288 
+ - 704 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 704 + - - 6 + - 3207.17 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 6784 + - - 14 + - 4357.86 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 256 + - - 6 + - 1935.41 + - - - 1024 + - 704 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 704 + - - 2 + - 708.497 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 64 + - - 6 + - 2089.27 + - - - 4288 + - 64 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 64 + - - 2 + - 365.605 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1024 + - - 14 + - 3788.51 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 768 + - 64 + - - 8 + - 81.243 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 5888 + - - 16 + - 4158.87 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 1408 + - - 6 + - 1771.79 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 704 + - - 5 + - 2175.12 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 1024 + - - 14 + - 3016.17 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 3584 + - - 16 + - 4344.42 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 5056 + - - 14 + - 3972.04 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 256 + - - 14 + - 3150.52 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1024 + - - 12 + - 2072.66 + - - - 5056 + - 2368 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 2368 + - - 3 + - 2044.64 + - - - 5888 + - 4 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 4 + - - 22 + - 54.5348 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1408 + - - 14 + - 3317.19 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 128 + - - 7 + - 2579.92 + - - - 4 + - 5056 + - 1 + - 768 + - 4 + - 4 + - 768 + - 5056 + - - 25 + - 172.426 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 704 + - - 14 + - 3331.43 + - - - 128 + - 704 + - 1 + - 3328 + - 
128 + - 128 + - 3328 + - 704 + - - 11 + - 1417.8 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1408 + - - 26 + - 122.009 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 5056 + - - 14 + - 4336.72 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 64 + - - 12 + - 2238.86 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 448 + - - 6 + - 3465.34 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 256 + - 5056 + - - 14 + - 2973.04 + - - - 2944 + - 3584 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 3584 + - - 3 + - 2035.7 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 128 + - - 6 + - 2026.32 + - - - 64 + - 704 + - 1 + - 256 + - 64 + - 64 + - 256 + - 704 + - - 17 + - 291.271 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 1024 + - - 14 + - 3716.54 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1408 + - - 6 + - 3631.36 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 6784 + - - 14 + - 3900.56 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 448 + - - 18 + - 4074.16 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 768 + - 1024 + - - 6 + - 1726.05 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 256 + - 1408 + - - 25 + - 24.5872 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1024 + - - 12 + - 2566.17 + - - - 1408 + - 1408 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 1408 + - - 3 + - 1123.61 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 768 + - 128 + - - 26 + - 7.81431 + - - - 64 + - 256 + - 1 + - 128 + - 64 + - 64 + - 128 + - 256 + - - 2 + - 23.2397 + - - - 3584 + - 128 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 2 + - 532.272 + - - - 5056 + - 128 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 2 + - 739.621 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 1024 + - - 16 + - 2927.74 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 5056 + - - 14 
+ - 3987.13 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 128 + - - 9 + - 492.62 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 448 + - - 6 + - 1856.99 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 2368 + - - 14 + - 3983.14 + - - - 4 + - 2944 + - 1 + - 128 + - 4 + - 4 + - 128 + - 2944 + - - 22 + - 26.1328 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 5056 + - - 14 + - 3223.25 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 5888 + - - 14 + - 4322.83 + - - - 4288 + - 5056 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 5056 + - - 3 + - 2244.03 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 64 + - - 17 + - 106.563 + - - - 1408 + - 3584 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 3584 + - - 3 + - 1719.35 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 4 + - - 26 + - 18.5392 + - - - 1856 + - 5056 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 5056 + - - 1 + - 2114.69 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 2368 + - - 6 + - 3800.22 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 4288 + - - 14 + - 4335.12 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 5888 + - - 14 + - 3744.67 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 64 + - - 6 + - 1820.7 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 64 + - - 6 + - 3311.04 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 256 + - - 6 + - 2406.33 + - - - 64 + - 5888 + - 1 + - 128 + - 64 + - 64 + - 128 + - 5888 + - - 2 + - 459.551 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 448 + - - 18 + - 3261.15 + - - - 5888 + - 1024 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 1024 + - - 3 + - 1486.43 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 2944 + - - 14 + - 4327.23 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 4288 + - - 14 + - 4079.0 + - - - 128 + - 
128 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 2 + - 24.8242 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1408 + - - 14 + - 4148.84 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 128 + - - 10 + - 2487.01 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 4 + - - 26 + - 173.019 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 448 + - - 6 + - 2533.32 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1856 + - - 26 + - 82.3935 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 448 + - - 6 + - 3006.16 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 2368 + - - 14 + - 3958.7 + - - - 1856 + - 128 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 128 + - - 6 + - 1927.86 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3584 + - - 16 + - 4128.97 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 256 + - 704 + - - 6 + - 1572.05 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 2944 + - - 14 + - 4052.77 + - - - 128 + - 1024 + - 1 + - 128 + - 128 + - 128 + - 128 + - 1024 + - - 2 + - 192.753 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1856 + - - 26 + - 155.564 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 4288 + - - 14 + - 3844.0 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1024 + - - 26 + - 92.5837 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 5888 + - - 14 + - 4439.56 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 4288 + - - 14 + - 4223.36 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1408 + - - 21 + - 1963.16 + - - - 1856 + - 6784 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 6784 + - - 4 + - 2107.3 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 256 + - 64 + - - 28 + - 1.68214 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1408 + - - 6 + - 3221.42 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 
5888 + - 768 + - 5888 + - - 14 + - 4418.72 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 2368 + - - 14 + - 4154.2 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 256 + - - 14 + - 3357.33 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 5888 + - - 6 + - 2939.2 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 256 + - 2944 + - - 6 + - 1065.25 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 5056 + - - 14 + - 4209.84 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 704 + - - 18 + - 3873.6 + - - - 1408 + - 5056 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 5056 + - - 3 + - 1828.28 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 4 + - - 26 + - 131.073 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1856 + - - 6 + - 979.662 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 64 + - - 6 + - 773.77 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 2944 + - - 6 + - 3364.88 + - - - 1408 + - 128 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 2 + - 259.549 + - - - 64 + - 3584 + - 1 + - 128 + - 64 + - 64 + - 128 + - 3584 + - - 2 + - 310.23 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 768 + - 128 + - - 6 + - 771.012 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 4 + - - 26 + - 64.8804 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 6784 + - - 14 + - 4264.23 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1024 + - - 16 + - 4073.76 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 4 + - - 24 + - 104.693 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 64 + - - 6 + - 1239.87 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 3584 + - - 14 + - 4231.49 + - - - 2368 + - 2368 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 2368 + - - 3 + - 1930.68 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 2368 + - - 7 + - 
2678.24 + - - - 4 + - 5056 + - 1 + - 128 + - 4 + - 4 + - 128 + - 5056 + - - 23 + - 44.3878 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1408 + - - 6 + - 2735.11 + - - - 2944 + - 704 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 704 + - - 3 + - 1162.33 + - - - 4288 + - 2368 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 2368 + - - 3 + - 2005.23 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1408 + - - 14 + - 3959.2 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 5888 + - - 14 + - 3975.22 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 64 + - - 13 + - 666.972 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 256 + - 4 + - - 29 + - 9.47835 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 2944 + - - 6 + - 3646.63 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1856 + - - 6 + - 3150.96 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 2944 + - - 14 + - 4197.61 + - - - 4 + - 2368 + - 1 + - 768 + - 4 + - 4 + - 768 + - 2368 + - - 26 + - 98.8383 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 256 + - - 12 + - 2550.38 + - - - 4288 + - 5888 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 5888 + - - 3 + - 2271.12 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 4 + - - 24 + - 96.6558 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 256 + - 448 + - - 17 + - 364.813 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 1408 + - - 14 + - 3841.47 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 6784 + - - 14 + - 4167.19 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 2944 + - - 6 + - 2851.7 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 5888 + - - 14 + - 3847.57 + - - - 2368 + - 6784 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 6784 + - - 3 + - 2206.67 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 1024 + - - 5 + - 1466.15 + - - - 256 + - 5888 
+ - 1 + - 256 + - 256 + - 256 + - 256 + - 5888 + - - 14 + - 2676.72 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1408 + - - 14 + - 4049.32 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 4 + - - 26 + - 96.496 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 5056 + - - 14 + - 4309.54 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 704 + - - 6 + - 3450.18 + - - - 2368 + - 256 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 256 + - - 2 + - 706.433 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 256 + - 2368 + - - 28 + - 40.4678 + - - - 4288 + - 1408 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 1408 + - - 3 + - 1817.16 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 768 + - 4288 + - - 25 + - 158.022 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 5888 + - - 14 + - 4440.15 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 3584 + - - 14 + - 3824.23 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 256 + - - 14 + - 2749.03 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 128 + - - 6 + - 3511.33 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 1408 + - - 14 + - 3857.79 + - - - 6784 + - 2368 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 2368 + - - 3 + - 2136.24 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 5056 + - - 14 + - 4166.78 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 5056 + - - 6 + - 2490.6 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 256 + - 128 + - - 17 + - 107.436 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 5888 + - - 14 + - 3729.95 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 128 + - - 6 + - 1858.03 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1856 + - - 14 + - 3523.05 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 768 + - 2944 + - - 25 + - 118.501 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 
3328 + - 1024 + - - 26 + - 135.449 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 4288 + - - 6 + - 3371.23 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 5888 + - - 14 + - 4152.54 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1024 + - - 16 + - 3911.83 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 704 + - - 6 + - 2511.23 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 6 + - 2348.81 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 5056 + - - 14 + - 4204.58 + - - - 4 + - 4 + - 1 + - 128 + - 4 + - 4 + - 128 + - 4 + - - 23 + - 0.0339976 + - - - 448 + - 1408 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1408 + - - 7 + - 2521.34 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 768 + - 256 + - - 17 + - 562.239 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1024 + - - 12 + - 1222.83 + - - - 128 + - 64 + - 1 + - 128 + - 128 + - 128 + - 128 + - 64 + - - 2 + - 12.4239 + - - - 6784 + - 1856 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 1856 + - - 3 + - 2059.9 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1856 + - - 18 + - 4043.31 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 256 + - - 14 + - 3296.31 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 704 + - 256 + - 128 + - - 6 + - 555.604 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 704 + - - 6 + - 2588.64 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 448 + - - 6 + - 2982.7 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 704 + - - 16 + - 3414.55 + - - - 1024 + - 5056 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 5056 + - - 4 + - 1525.84 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 128 + - - 10 + - 2334.7 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 5888 + - - 14 + - 4255.07 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 704 + - - 16 + 
- 3762.02 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 4288 + - - 5 + - 2247.76 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 768 + - 3584 + - - 6 + - 3179.8 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 128 + - - 6 + - 3288.44 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1024 + - - 14 + - 3922.5 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 704 + - - 6 + - 2146.1 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 768 + - 704 + - - 6 + - 1979.17 + - - - 3584 + - 4 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 4 + - - 22 + - 32.9093 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 3584 + - - 14 + - 4167.9 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 5888 + - - 14 + - 4135.56 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 3584 + - - 14 + - 3526.1 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 448 + - - 6 + - 3481.88 + - - - 1408 + - 64 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 64 + - - 6 + - 553.471 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 768 + - 256 + - - 8 + - 142.47 + - - - 1024 + - 1856 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 1856 + - - 4 + - 1211.02 + - - - 4288 + - 1856 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 1856 + - - 3 + - 1905.95 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 768 + - 6784 + - - 6 + - 2845.11 + - - - 256 + - 5888 + - 1 + - 128 + - 256 + - 256 + - 128 + - 5888 + - - 4 + - 841.789 + - - - 704 + - 5888 + - 1 + - 128 + - 704 + - 704 + - 128 + - 5888 + - - 3 + - 1638.81 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 5888 + - - 14 + - 4209.39 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 704 + - - 6 + - 3413.65 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 5056 + - - 14 + - 4340.31 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 256 + - 4 + - - 25 + - 3.25726 + - - - 448 + - 4288 + - 1 + - 
128 + - 448 + - 448 + - 128 + - 4288 + - - 4 + - 1417.73 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 2368 + - - 10 + - 2400.83 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1856 + - - 6 + - 3779.2 + - - - 2368 + - 704 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 704 + - - 3 + - 1337.0 + - - - 5056 + - 1408 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 1408 + - - 1 + - 1943.71 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 128 + - - 6 + - 2748.28 + - - - 2944 + - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 4 + - - 25 + - 168.114 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 256 + - 448 + - - 28 + - 9.41609 + - - - 2944 + - 448 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 448 + - - 3 + - 1000.12 + - - - 4 + - 2368 + - 1 + - 128 + - 4 + - 4 + - 128 + - 2368 + - - 22 + - 21.0491 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 6 + - 1035.4 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1408 + - - 14 + - 3806.17 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 704 + - - 16 + - 3949.24 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 3584 + - - 14 + - 4233.23 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 1408 + - - 14 + - 3365.77 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 256 + - 4288 + - - 6 + - 1365.76 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1856 + - - 6 + - 3329.36 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 4 + - - 26 + - 67.3915 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1856 + - - 14 + - 3188.1 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 6784 + - - 14 + - 4460.5 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 256 + - - 14 + - 3844.35 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 768 + - 704 + - - 6 + - 1485.11 + - - - 5056 + - 448 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 448 + - - 
4 + - 1343.77 + - - - 6784 + - 704 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 704 + - - 3 + - 1772.56 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 2368 + - - 12 + - 2382.29 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 2368 + - - 14 + - 3920.37 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 128 + - - 6 + - 2191.05 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 448 + - - 10 + - 2753.19 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 256 + - 448 + - - 6 + - 1559.9 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 2944 + - - 6 + - 2894.43 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 4 + - - 24 + - 114.729 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 256 + - - 7 + - 2453.31 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 128 + - - 17 + - 212.693 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 1024 + - - 14 + - 4234.97 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 256 + - 6784 + - - 14 + - 2993.4 + - - - 4 + - 128 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 22 + - 1.12994 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 6784 + - - 14 + - 4278.9 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 4 + - - 29 + - 181.46 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1408 + - - 6 + - 2660.31 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 4 + - - 26 + - 65.8553 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 5056 + - - 14 + - 3919.88 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1408 + - - 14 + - 3974.25 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 256 + - 2368 + - - 6 + - 884.975 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 3584 + - - 14 + - 4458.34 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 6784 + - - 14 + - 4503.64 + - - - 1408 + - 
1408 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 1408 + - - 14 + - 2638.89 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 5056 + - - 6 + - 3383.68 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 2944 + - - 14 + - 3778.86 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 689.853 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1024 + - - 16 + - 4142.52 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 5888 + - - 14 + - 4114.08 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 6784 + - - 14 + - 4210.19 + - - - 3584 + - 3584 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 3584 + - - 4 + - 1787.76 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 4 + - - 24 + - 67.877 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 768 + - 256 + - - 26 + - 15.147 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 4 + - - 26 + - 0.470341 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 6784 + - - 14 + - 4442.22 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 704 + - - 5 + - 2582.05 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3584 + - - 6 + - 3561.79 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 256 + - - 6 + - 2846.41 + - - - 1856 + - 4288 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 4288 + - - 3 + - 1925.26 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 1024 + - - 18 + - 3593.02 + - - - 256 + - 2944 + - 1 + - 128 + - 256 + - 256 + - 128 + - 2944 + - - 2 + - 628.381 + - - - 704 + - 1856 + - 1 + - 128 + - 704 + - 704 + - 128 + - 1856 + - - 3 + - 1019.31 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 64 + - - 5 + - 1883.08 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 4288 + - - 14 + - 3453.09 + - - - 5056 + - 4 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 4 + - - 22 + - 46.4924 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 
2368 + - 768 + - 5888 + - - 14 + - 4243.3 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 6784 + - - 14 + - 4423.66 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 4288 + - - 15 + - 2207.68 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 4288 + - - 6 + - 2818.88 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 256 + - 1408 + - - 6 + - 554.535 + - - - 4288 + - 2944 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 2944 + - - 14 + - 4090.91 + - - - 3584 + - 1024 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 1024 + - - 4 + - 1365.91 + - - - 6784 + - 448 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 448 + - - 1 + - 1454.61 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 4 + - - 26 + - 39.7003 + - - - 4 + - 1024 + - 1 + - 128 + - 4 + - 4 + - 128 + - 1024 + - - 23 + - 9.34901 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4288 + - - 6 + - 2314.05 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 6784 + - - 6 + - 3378.55 + - - - 5056 + - 64 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 64 + - - 2 + - 421.951 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 5888 + - - 14 + - 4365.29 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 3584 + - - 16 + - 4031.21 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 4 + - - 25 + - 203.742 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1856 + - - 18 + - 3916.08 + - - - 5888 + - 1856 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 1856 + - - 4 + - 1818.52 + - - - 3584 + - 3584 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 3584 + - - 14 + - 4133.01 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 256 + - 1856 + - - 6 + - 2547.96 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 5056 + - - 14 + - 3944.87 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 256 + - 448 + - - 6 + - 1122.82 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 4288 + 
- - 16 + - 4356.68 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 1856 + - - 16 + - 4130.38 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 704 + - - 6 + - 3118.74 + - - - 704 + - 1024 + - 1 + - 128 + - 704 + - 704 + - 128 + - 1024 + - - 2 + - 813.997 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 2944 + - - 14 + - 4112.91 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 64 + - - 6 + - 894.772 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 256 + - 5888 + - - 6 + - 1786.46 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 64 + - - 6 + - 1804.93 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 4288 + - - 14 + - 4305.44 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 6784 + - - 6 + - 3380.28 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 704 + - - 6 + - 1959.96 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 1024 + - - 16 + - 3444.88 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 768 + - 2944 + - - 6 + - 3181.95 + - - - 64 + - 448 + - 1 + - 128 + - 64 + - 64 + - 128 + - 448 + - - 2 + - 42.5954 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 128 + - - 6 + - 1510.8 + - - - 4288 + - 448 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 448 + - - 3 + - 1419.04 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 6784 + - - 14 + - 4189.55 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 1408 + - - 14 + - 4257.5 + - - - 448 + - 5056 + - 1 + - 128 + - 448 + - 448 + - 128 + - 5056 + - - 3 + - 1355.83 + - - - 3584 + - 5056 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 5056 + - - 4 + - 1979.33 + - - - 1856 + - 5888 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 5888 + - - 1 + - 2091.51 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 4288 + - - 14 + - 4300.73 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 768 + - 64 + - - 17 + - 392.502 + - - - 128 + 
- 1856 + - 1 + - 768 + - 128 + - 128 + - 768 + - 1856 + - - 6 + - 1878.63 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 256 + - - 9 + - 391.484 + - - - 448 + - 4 + - 1 + - 128 + - 448 + - 448 + - 128 + - 4 + - - 22 + - 4.39085 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 4288 + - - 14 + - 4042.25 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 448 + - - 14 + - 3411.7 + - - - 1856 + - 64 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 64 + - - 5 + - 1318.51 + - - - 1408 + - 5888 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 5888 + - - 3 + - 1882.83 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 768 + - 3584 + - - 12 + - 1691.25 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 256 + - 5056 + - - 14 + - 3358.94 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 256 + - 6784 + - - 14 + - 3913.7 + - - - 3584 + - 1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 1856 + - - 18 + - 3958.11 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 1856 + - - 14 + - 3954.34 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 256 + - - 6 + - 3640.08 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 768 + - 1856 + - - 6 + - 3139.23 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 768 + - 448 + - - 26 + - 24.7172 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 4288 + - - 14 + - 3951.93 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 4288 + - - 14 + - 4229.92 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 704 + - - 6 + - 2310.26 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 1856 + - - 14 + - 3792.69 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 768 + - 256 + - - 17 + - 285.456 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 704 + - - 12 + - 2801.05 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 704 + - - 26 + - 67.6807 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 
+ - 3328 + - 4288 + - - 6 + - 3680.17 + - - - 128 + - 6784 + - 1 + - 128 + - 128 + - 128 + - 128 + - 6784 + - - 2 + - 837.975 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 704 + - - 14 + - 3474.57 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 768 + - 6784 + - - 24 + - 204.64 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 768 + - 6784 + - - 14 + - 3530.04 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 128 + - - 26 + - 20.5789 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 448 + - - 6 + - 3301.27 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1856 + - - 14 + - 4279.93 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 1408 + - - 6 + - 3645.25 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 256 + - - 11 + - 782.103 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 1024 + - - 14 + - 3578.29 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 4288 + - - 14 + - 4353.68 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 1856 + - - 14 + - 3270.0 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 2368 + - - 14 + - 4064.93 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 1408 + - - 6 + - 2761.45 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 256 + - 2944 + - - 6 + - 2537.89 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 256 + - 5888 + - - 14 + - 3450.7 + - - - 1408 + - 4 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 4 + - - 22 + - 13.3106 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 4 + - - 26 + - 5.80993 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 256 + - 6784 + - - 6 + - 2124.41 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 1024 + - - 14 + - 3360.12 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 4 + - - 24 + - 82.9858 + - - - 448 + - 64 + - 1 + - 128 + - 448 + - 448 + - 128 + - 64 + - - 2 + - 41.5536 + - - - 
64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 64 + - - 19 + - 86.8026 + - - - 256 + - 6784 + - 1 + - 128 + - 256 + - 256 + - 128 + - 6784 + - - 4 + - 1128.19 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 256 + - - 10 + - 3293.34 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 704 + - - 6 + - 2674.29 + - - - 6784 + - 5888 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 5888 + - - 3 + - 2291.94 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 256 + - 448 + - - 17 + - 185.73 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 5888 + - - 14 + - 4196.68 + - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 128 + - - 6 + - 773.857 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 64 + - - 6 + - 2889.09 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 6784 + - - 14 + - 4416.18 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 768 + - 1408 + - - 26 + - 64.5964 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 2944 + - - 18 + - 3911.1 + - - - 704 + - 2368 + - 1 + - 128 + - 704 + - 704 + - 128 + - 2368 + - - 3 + - 1279.29 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 128 + - - 6 + - 1492.8 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 256 + - - 6 + - 3491.81 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 3584 + - - 12 + - 2023.64 + - - - 256 + - 704 + - 1 + - 128 + - 256 + - 256 + - 128 + - 704 + - - 2 + - 253.837 + - - - 704 + - 448 + - 1 + - 128 + - 704 + - 704 + - 128 + - 448 + - - 2 + - 418.431 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 64 + - - 11 + - 1056.26 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 64 + - - 8 + - 273.678 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1408 + - - 16 + - 3733.68 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 4 + - - 29 + - 85.4561 + - - - 1024 + - 448 + - 1 + - 128 + - 1024 + - 1024 + 
- 128 + - 448 + - - 2 + - 524.288 + - - - 4288 + - 1024 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 1024 + - - 3 + - 1680.33 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 768 + - 6784 + - - 6 + - 3315.91 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 2944 + - - 14 + - 4143.93 + - - - 1408 + - 2368 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 2368 + - - 1 + - 1529.87 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 5888 + - - 14 + - 4143.37 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 256 + - - 11 + - 1136.43 + - - - 5888 + - 128 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 2 + - 793.853 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 1024 + - - 14 + - 3841.0 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 64 + - - 17 + - 408.006 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 2368 + - - 6 + - 1876.08 + - - - 448 + - 5888 + - 1 + - 128 + - 448 + - 448 + - 128 + - 5888 + - - 4 + - 1484.01 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 704 + - - 14 + - 3667.12 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 64 + - - 11 + - 967.458 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 2368 + - - 14 + - 4284.79 + - - - 704 + - 64 + - 1 + - 128 + - 704 + - 704 + - 128 + - 64 + - - 2 + - 64.8288 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 4288 + - - 14 + - 3888.22 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 64 + - - 6 + - 2386.66 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 4288 + - - 14 + - 3815.81 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 1024 + - - 6 + - 3342.81 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 5056 + - - 7 + - 2813.78 + - - - 256 + - 2368 + - 1 + - 128 + - 256 + - 256 + - 128 + - 2368 + - - 2 + - 549.226 + - - - 2368 + - 4288 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 4288 
+ - - 3 + - 2038.44 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 1024 + - - 14 + - 3753.73 + - - - 4 + - 1856 + - 1 + - 128 + - 4 + - 4 + - 128 + - 1856 + - - 22 + - 16.5439 + - - - 5888 + - 6784 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 6784 + - - 4 + - 2078.06 + - - - 5056 + - 256 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 256 + - - 3 + - 983.351 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 4288 + - - 18 + - 4121.48 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 256 + - - 26 + - 40.764 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 3584 + - - 6 + - 3451.82 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 4 + - - 26 + - 124.415 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 4288 + - - 10 + - 3468.87 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 704 + - - 18 + - 3772.65 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 4288 + - - 18 + - 3925.89 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 768 + - 1024 + - - 17 + - 564.256 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 2944 + - - 18 + - 4067.41 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 4 + - - 26 + - 0.655768 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3584 + - - 14 + - 3859.06 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 448 + - - 12 + - 2291.16 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1856 + - - 6 + - 3497.55 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 448 + - - 6 + - 2337.78 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 2944 + - - 12 + - 1721.96 + - - - 5888 + - 2944 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 2944 + - - 3 + - 1793.74 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 1024 + - - 14 + - 3589.57 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 3584 + - - 14 + - 4256.09 + - - - 256 
+ - 5888 + - 1 + - 768 + - 256 + - 256 + - 768 + - 5888 + - - 14 + - 3117.94 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 128 + - - 19 + - 145.636 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 256 + - - 6 + - 1683.49 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3584 + - - 18 + - 3951.38 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 1024 + - - 14 + - 3278.18 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 448 + - - 6 + - 2293.76 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 768 + - 256 + - - 6 + - 1487.66 + - - - 1408 + - 4288 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 4288 + - - 3 + - 1788.56 + - - - 2368 + - 4 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 4 + - - 22 + - 21.8377 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 2368 + - - 14 + - 3825.21 + - - - 3584 + - 256 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 256 + - - 2 + - 870.704 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1024 + - - 6 + - 3161.86 + - - - 1408 + - 256 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 256 + - - 2 + - 462.855 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 448 + - - 18 + - 3810.3 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 1856 + - - 14 + - 3378.74 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 448 + - - 10 + - 2473.66 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 5888 + - - 25 + - 350.292 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 2368 + - - 14 + - 3857.82 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 448 + - - 14 + - 3300.17 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 256 + - 128 + - - 17 + - 52.6394 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 2368 + - - 14 + - 4144.19 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 448 + - - 6 + - 3238.59 + - - - 2944 + - 5888 + - 1 + - 128 + - 2944 
+ - 2944 + - 128 + - 5888 + - - 1 + - 2121.21 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 448 + - - 6 + - 685.984 +- null diff --git a/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml new file mode 100644 index 000000000..69c035b52 --- /dev/null +++ b/HostLibraryTests/configs/lite_configs_mixed/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml @@ -0,0 +1,19239 @@ +- MinimumRequiredVersion: 4.12.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + 
DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 3072 + LdsOffsetA: 0 + LdsOffsetB: 1024 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: 
false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x128x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + 
EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsOffsetA: 0 + LdsOffsetB: 2048 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: false + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 
+ ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x128x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + 
ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + 
Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x64x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + 
DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 32 + LSCB: 32 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 32 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 4 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 4 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: 
true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x32_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: 
false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 16 + LSCB: 16 + LSPA: 16 + LSPB: 16 + LVCA: 4 + LVCB: 4 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + 
PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x64x16_SE_AMAS2_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: 
true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 
+ PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + 
AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 64 + LVCA: 8 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 
+ PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + 
AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 
1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + 
AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 32 + LVCA: 4 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + 
NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 8 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x32x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + 
WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + 
NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 9 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true 
+ VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + 
NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 10 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU8_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + 
UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 5120 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + 
NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 1 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 11 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x128x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + 
ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + 
MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 12 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + 
SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + 
MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsA: 2 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 13 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x128x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 
0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 32 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + 
LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 64 + MacroTile1: 128 + MacroTileA: 64 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 2 + NumLoadsB: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 4 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 14 + SolutionNameMin: 
Cijk_Alik_Bljk_SB_MT64x128x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 64 + LVCA: 8 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + 
LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + 
ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 15 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x64x16_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 64 + LVCA: 8 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 512 + LdsOffsetB_Blk: 2560 + LdsPadA: 0 + LdsPadB: 0 + 
LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 64 + MacroTileA: 32 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: 
[] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 16 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x64x16_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 8 + ThreadTile0: 4 + ThreadTile1: 8 + ThreadTileA: 4 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 7168 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + 
LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 8 + NumLoadsA: 2 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + 
TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 17 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x64x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 512 
+ LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + 
TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 18 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x16_SE_AMAS3_GRVW4_GSU1_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 32 + LVCA: 4 + LVCB: 8 + LVPA: 16 + LVPB: 16 + 
LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + 
TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 19 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x32x16_SE_AMAS3_GRVW4_GSU4_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + 
LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 32 + LVPB: 32 + LdcEqualsLdd: true + LdsNumElements: 3584 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 128 + MacroTile1: 64 + MacroTileA: 128 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 32 + NumGlobalWriteVectorsPerThread: 32 + NumLoadsA: 4 + NumLoadsB: 2 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 4 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] 
+ SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 20 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x64x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 32 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + 
InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 32 + LSCB: 32 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 8 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + 
NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 21 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x32_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 1 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BenchmarkFork: 0 + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + 
GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 32 + LVCA: 4 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 32 + MacroTileA: 64 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 8 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + 
NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 22 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x32x16_SE_AMAS3_GRVW4_GSU2_VW4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 4 + ThreadTile0: 8 + ThreadTile1: 4 + ThreadTileA: 8 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 8 + WorkGroupMappingType: B + _staggerStrideShift: 2 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 2 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + 
GlobalWriteVectorWidth: 2 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 4 + LSCB: 4 + LSPA: 16 + LSPB: 16 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 2 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 
0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 23 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT16x16x4_SE_AMAS2_GRVW2_GSU1_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: false + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 4 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: false + FractionalLoad: false + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + 
GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 0 + - 0 + - 0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Source + LSCA: 4 + LSCB: 4 + LSPA: 16 + LSPB: 16 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 16 + MacroTile1: 16 + MacroTileA: 16 + MacroTileB: 16 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + 
IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 24 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT16x16x4_SE_AMAS0_GRVW1_GSU1_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 0 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 8 + - 8 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 4 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + GlobalSplitU: 2 + 
GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + 
IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 25 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU2_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 2 + 
GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + 
- 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 26 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU4_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + 
GlobalReadVectorWidth: 2 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + 
IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 27 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS3_GRVW2_GSU8_VW2 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 2 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + 
GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 2 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + 
IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 28 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU2_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + 
GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + 
IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 29 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU4_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 0 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 8 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 0 + GlobalLoadVectorWidthA: 1 + GlobalLoadVectorWidthB: 1 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + 
GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 1 + GlobalSplitU: 8 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 1 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 8 + LSCB: 8 + LSPA: 8 + LSPB: 8 + LVCA: 8 + LVCB: 8 + LVPA: 8 + LVPB: 8 + LdcEqualsLdd: true + LdsNumElements: 409 + LdsNumElementsAlignedA: 64 + LdsNumElementsAlignedB: 64 + LdsOffsetA: 0 + LdsOffsetA_Blk: 128 + LdsOffsetB: 64 + LdsOffsetB_Blk: 192 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 2 + MacroTile0: 8 + MacroTile1: 8 + MacroTileA: 8 + MacroTileB: 8 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 1 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsA: 1 + NumLoadsB: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 64 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + 
Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: false + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 30 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT8x8x8_SE_AMAS0_GRVW1_GSU8_VW1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 4 + SubGroup1: 4 + SubGroupA: 4 + SubGroupB: 4 + SuppressNoLoadLoop: false + ThreadTile: + - 2 + - 2 + ThreadTile0: 2 + ThreadTile1: 2 + ThreadTileA: 2 + ThreadTileB: 2 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 1 + WorkGroup: + - 4 + - 4 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 3 +- - 2 + - 3 + - 0 + - 1 +- - - - 6784 + - 448 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 12 + - 2943.57 + - - - 1856 + - 6784 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 4030.09 + - - - 704 + - 448 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 14 + - 2175.48 + - - - 2944 + - 704 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 8 + - 3058.29 + - - - 3584 + - 4288 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 2020.31 + - - - 704 + - 1856 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 12 + - 2918.47 + - - - 4 + - 3584 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - 
- 23 + - 33.0993 + - - - 5056 + - 1856 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2128.18 + - - - 3584 + - 2368 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1823.18 + - - - 1408 + - 2944 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 11 + - 3301.5 + - - - 128 + - 4 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 23 + - 1.26812 + - - - 64 + - 1024 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 84.223 + - - - 1408 + - 1024 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 2912.71 + - - - 3584 + - 5056 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 13 + - 3954.96 + - - - 704 + - 4 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 27 + - 67.4635 + - - - 1408 + - 128 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 15 + - 1769.49 + - - - 2368 + - 2944 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 13 + - 3795.25 + - - - 3584 + - 1024 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 13 + - 3309.12 + - - - 2368 + - 2368 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 11 + - 3898.8 + - - - 128 + - 128 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 316.927 + - - - 256 + - 4 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 27 + - 28.1789 + - - - 4288 + - 5888 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 11 + - 3885.39 + - - - 448 + - 5888 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2938.06 + - - - 256 + - 2368 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 570.549 + - - - 5888 + - 5888 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 13 + - 4257.51 + - - - 3584 + - 4 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 25 + - 117.715 + - - - 1856 + - 2944 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 13 + - 3791.67 + - - - 704 + - 4 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 27 + - 36.0448 + - - - 64 + - 256 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 126.64 + - - - 1856 + - 
128 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 8 + - 1840.72 + - - - 5888 + - 4 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 30 + - 65.0705 + - - - 4288 + - 704 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 12 + - 2925.5 + - - - 6784 + - 128 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 12 + - 3041.21 + - - - 3584 + - 6784 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 4076.21 + - - - 2368 + - 3584 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 2093.92 + - - - 1408 + - 4 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 26 + - 24.9618 + - - - 448 + - 448 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 8 + - 1583.2 + - - - 4 + - 1408 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 30 + - 63.9092 + - - - 5056 + - 256 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 950.407 + - - - 1856 + - 5056 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 3919.67 + - - - 5056 + - 704 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4014.64 + - - - 4288 + - 448 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 17 + - 3871.78 + - - - 256 + - 6784 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 11 + - 2962.39 + - - - 3584 + - 2368 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 3884.3 + - - - 5056 + - 4 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 28 + - 65.1178 + - - - 704 + - 1024 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 8 + - 2657.68 + - - - 2944 + - 256 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 12 + - 2601.64 + - - - 2944 + - 256 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 12 + - 2644.21 + - - - 6784 + - 64 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 8 + - 2748.88 + - - - 6784 + - 1408 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2037.19 + - - - 4288 + - 5888 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 13 + - 4051.46 + - - - 4288 + - 2944 + - 1 + 
- 768 + - 4288 + - 4288 + - 768 + - 768 + - - 11 + - 3964.71 + - - - 64 + - 2368 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 1125.21 + - - - 1408 + - 4288 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1802.58 + - - - 1408 + - 3584 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1707.71 + - - - 1408 + - 5056 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 13 + - 4045.69 + - - - 1856 + - 1856 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 13 + - 3092.05 + - - - 1024 + - 4288 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 17 + - 3493.15 + - - - 2944 + - 1408 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 8 + - 3326.29 + - - - 2368 + - 4 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 26 + - 40.8496 + - - - 4288 + - 5888 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 4134.11 + - - - 1024 + - 6784 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 13 + - 3655.82 + - - - 3584 + - 4288 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 13 + - 4280.89 + - - - 6784 + - 256 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 11 + - 3407.39 + - - - 2368 + - 1856 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 11 + - 3507.78 + - - - 4288 + - 1408 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 11 + - 3446.52 + - - - 2368 + - 6784 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 11 + - 3706.31 + - - - 1024 + - 128 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 6 + - 1127.5 + - - - 448 + - 704 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 2004.76 + - - - 4288 + - 4288 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 11 + - 3764.68 + - - - 5888 + - 1408 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 1861.42 + - - - 5056 + - 5888 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 13 + - 3881.64 + - - - 128 + - 1408 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 1046.67 + - - - 2944 + - 6784 + - 1 + 
- 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 17 + - 3968.68 + - - - 1024 + - 5888 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 17 + - 3432.04 + - - - 2944 + - 704 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 8 + - 2996.75 + - - - 3584 + - 5056 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3735.99 + - - - 6784 + - 4 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 27 + - 193.541 + - - - 704 + - 2944 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 8 + - 3111.93 + - - - 2944 + - 1856 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 11 + - 3682.09 + - - - 3584 + - 128 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 8 + - 2610.56 + - - - 128 + - 1856 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 277.654 + - - - 5056 + - 64 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 8 + - 2048.69 + - - - 5888 + - 6784 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 4169.73 + - - - 1856 + - 3584 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 3872.86 + - - - 2368 + - 1856 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 1784.32 + - - - 5888 + - 5056 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 13 + - 4098.87 + - - - 1408 + - 4288 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 3255.82 + - - - 4288 + - 4 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 26 + - 67.9287 + - - - 2368 + - 64 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 5 + - 1292.26 + - - - 448 + - 1408 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 8 + - 1898.88 + - - - 5888 + - 1408 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 17 + - 3480.58 + - - - 1856 + - 704 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 12 + - 3009.91 + - - - 4 + - 2944 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 27.0715 + - - - 5056 + - 256 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 12 + - 2618.13 + - - - 4 + - 1024 + - 1 + - 256 + - 4 + - 
4 + - 256 + - 256 + - - 26 + - 17.9305 + - - - 1408 + - 2944 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1623.96 + - - - 448 + - 5888 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1622.03 + - - - 1856 + - 256 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 3 + - 531.993 + - - - 2368 + - 64 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 5 + - 1602.99 + - - - 1024 + - 256 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 8 + - 1670.56 + - - - 2944 + - 4288 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 17 + - 4025.95 + - - - 704 + - 1024 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 2814.72 + - - - 1856 + - 4 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 27 + - 206.72 + - - - 5888 + - 64 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 8 + - 1715.31 + - - - 256 + - 256 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 18 + - 682.37 + - - - 448 + - 6784 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2944.46 + - - - 1408 + - 2368 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 13 + - 3702.04 + - - - 5056 + - 1024 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 11 + - 3532.77 + - - - 6784 + - 704 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 17 + - 3313.75 + - - - 5056 + - 448 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 8 + - 3023.9 + - - - 128 + - 5056 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 0 + - 625.661 + - - - 5056 + - 2944 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4097.22 + - - - 704 + - 3584 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 11 + - 3194.21 + - - - 5888 + - 1024 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 1765.54 + - - - 4 + - 4288 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 39.261 + - - - 5888 + - 448 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 17 + - 3342.61 + - - - 704 + - 4288 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + 
- 1489.36 + - - - 448 + - 1856 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 12 + - 2740.23 + - - - 128 + - 5888 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 12 + - 2594.05 + - - - 64 + - 64 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 5.116 + - - - 1024 + - 3584 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 13 + - 4012.71 + - - - 2368 + - 1024 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 8 + - 3246.64 + - - - 4 + - 704 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 6.40006 + - - - 128 + - 3584 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 2830.09 + - - - 4 + - 1024 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 91.8428 + - - - 5888 + - 2944 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2074.41 + - - - 256 + - 2944 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 4 + - 680.893 + - - - 5056 + - 3584 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4142.97 + - - - 448 + - 704 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 8 + - 1848.45 + - - - 6784 + - 2944 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 17 + - 3965.71 + - - - 4288 + - 256 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 12 + - 2240.26 + - - - 2368 + - 1856 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 17 + - 3486.99 + - - - 448 + - 6784 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 13 + - 3178.98 + - - - 256 + - 3584 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 3044.44 + - - - 5056 + - 704 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 3940.45 + - - - 1408 + - 704 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 20 + - 2643.46 + - - - 128 + - 256 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 41.1206 + - - - 1024 + - 1856 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 17 + - 3247.06 + - - - 2368 + - 1024 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 12 + - 3130.08 + - - - 4 + - 2368 + 
- 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 29 + - 94.6214 + - - - 2944 + - 1408 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 12 + - 3244.21 + - - - 704 + - 5056 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 13 + - 4014.32 + - - - 704 + - 448 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 8 + - 1858.66 + - - - 2944 + - 4288 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 17 + - 3954.88 + - - - 4 + - 128 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 + - 7.8019 + - - - 4 + - 3584 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 25 + - 68.3061 + - - - 448 + - 5888 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 11 + - 3315.82 + - - - 4 + - 2944 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 26 + - 192.543 + - - - 5888 + - 256 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 17 + - 2967.67 + - - - 128 + - 128 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 18 + - 172.463 + - - - 4288 + - 2944 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 11 + - 3751.87 + - - - 256 + - 2368 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 8 + - 2316.85 + - - - 5888 + - 1856 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 4137.71 + - - - 704 + - 5056 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 13 + - 3712.17 + - - - 4 + - 3584 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 29 + - 132.972 + - - - 704 + - 5888 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 3308.8 + - - - 5888 + - 704 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 17 + - 3301.03 + - - - 448 + - 64 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 483.624 + - - - 3584 + - 2368 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3509.71 + - - - 4288 + - 64 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 3 + - 324.772 + - - - 128 + - 4288 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 0 + - 530.624 + - - - 1856 + - 6784 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 11 + 
- 3743.18 + - - - 4 + - 64 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 30 + - 1.64498 + - - - 256 + - 704 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 215.193 + - - - 4288 + - 1856 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 1993.68 + - - - 5888 + - 2368 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 17 + - 3646.66 + - - - 1856 + - 5056 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 11 + - 3562.96 + - - - 5888 + - 5888 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 4401.47 + - - - 6784 + - 1408 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 11 + - 3923.75 + - - - 4 + - 6784 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 26 + - 170.936 + - - - 2368 + - 4 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 26 + - 194.298 + - - - 128 + - 3584 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 2000.01 + - - - 4 + - 256 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 39.7373 + - - - 2368 + - 1024 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 12 + - 3355.2 + - - - 1024 + - 256 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 8 + - 1718.16 + - - - 2944 + - 2368 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 17 + - 3307.9 + - - - 704 + - 5056 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 13 + - 3933.26 + - - - 1024 + - 5056 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 17 + - 3591.48 + - - - 6784 + - 2944 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 3946.89 + - - - 1408 + - 128 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 8 + - 1432.24 + - - - 6784 + - 2944 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3772.77 + - - - 2944 + - 64 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 3 + - 226.496 + - - - 64 + - 4 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 27 + - 4.33439 + - - - 128 + - 2368 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 1750.78 + - - - 64 + - 704 + - 1 + - 256 + - 
64 + - 64 + - 256 + - 256 + - - 18 + - 348.259 + - - - 2368 + - 5056 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 17 + - 3814.29 + - - - 704 + - 5888 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 8 + - 3277.49 + - - - 448 + - 1408 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 8 + - 2535.08 + - - - 256 + - 1024 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 8 + - 1200.09 + - - - 4 + - 6784 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 92.084 + - - - 5888 + - 64 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 8 + - 2466.36 + - - - 3584 + - 1408 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 11 + - 3446.52 + - - - 4288 + - 1856 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 11 + - 3628.42 + - - - 3584 + - 1856 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1793.87 + - - - 6784 + - 1024 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 13 + - 3389.72 + - - - 5056 + - 2368 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 17 + - 3555.34 + - - - 128 + - 448 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 785.15 + - - - 256 + - 2944 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 12 + - 2117.41 + - - - 2944 + - 448 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 8 + - 2898.71 + - - - 3584 + - 1856 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3844.44 + - - - 4288 + - 4 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 23 + - 39.487 + - - - 1024 + - 1408 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 12 + - 3197.32 + - - - 1856 + - 1024 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 11 + - 3735.71 + - - - 448 + - 2368 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2156.78 + - - - 1024 + - 6784 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 13 + - 3923.21 + - - - 1408 + - 2368 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 13 + - 3768.93 + - - - 64 + - 4 + - 1 + - 1792 + - 64 + - 64 + - 1792 
+ - 1792 + - - 27 + - 7.77019 + - - - 128 + - 704 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 1338.33 + - - - 5888 + - 1408 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 11 + - 3775.83 + - - - 6784 + - 1856 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 17 + - 3715.56 + - - - 2368 + - 2368 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 11 + - 3788.54 + - - - 2368 + - 128 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 8 + - 1385.62 + - - - 3584 + - 6784 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 4089.55 + - - - 2368 + - 3584 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 11 + - 3546.84 + - - - 64 + - 3584 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 18 + - 1869.05 + - - - 6784 + - 256 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 11 + - 3590.44 + - - - 704 + - 2368 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 17 + - 2813.62 + - - - 4288 + - 4288 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 4200.33 + - - - 3584 + - 1856 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3429.92 + - - - 128 + - 128 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 453.174 + - - - 1856 + - 128 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 8 + - 1288.5 + - - - 3584 + - 448 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 2757.93 + - - - 2944 + - 1856 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 13 + - 3843.19 + - - - 1024 + - 5056 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 3265.82 + - - - 448 + - 64 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 18 + - 221.619 + - - - 2368 + - 5888 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 13 + - 3866.96 + - - - 4 + - 5888 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 53.6802 + - - - 1856 + - 5056 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 2132.41 + - - - 5056 + - 4288 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + 
- - 13 + - 4091.25 + - - - 5888 + - 4 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 25 + - 129.91 + - - - 6784 + - 448 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 3174.83 + - - - 64 + - 1408 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 1321.81 + - - - 1024 + - 3584 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1464.35 + - - - 448 + - 2944 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 8 + - 2964.17 + - - - 64 + - 1024 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 988.505 + - - - 4 + - 1024 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 + - 48.0117 + - - - 704 + - 128 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 1347.95 + - - - 2944 + - 6784 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 11 + - 3940.81 + - - - 4288 + - 1024 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 1778.6 + - - - 1408 + - 256 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 3 + - 427.514 + - - - 3584 + - 6784 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3841.81 + - - - 704 + - 704 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 7 + - 2221.25 + - - - 1408 + - 6784 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 2040.18 + - - - 6784 + - 448 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 1 + - 1378.73 + - - - 4 + - 2944 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 25 + - 158.538 + - - - 4288 + - 2368 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 3860.23 + - - - 64 + - 128 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 63.1672 + - - - 256 + - 128 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 18 + - 349.914 + - - - 2944 + - 2944 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 11 + - 3614.13 + - - - 1856 + - 2944 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1932.9 + - - - 128 + - 64 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 5 + - 92.9589 + - - - 64 + - 704 + - 1 + - 768 
+ - 64 + - 64 + - 768 + - 768 + - - 18 + - 477.415 + - - - 3584 + - 128 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 8 + - 2880.06 + - - - 256 + - 1856 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 3101.47 + - - - 128 + - 6784 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 12 + - 2990.64 + - - - 1856 + - 4288 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1988.7 + - - - 64 + - 64 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 27.8877 + - - - 2368 + - 6784 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 2192.74 + - - - 3584 + - 3584 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 11 + - 3607.21 + - - - 1408 + - 5888 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 11 + - 3719.54 + - - - 2944 + - 4 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 23 + - 27.1495 + - - - 256 + - 448 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 936.229 + - - - 2368 + - 5056 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 17 + - 3540.88 + - - - 448 + - 4 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 27 + - 46.2452 + - - - 2368 + - 4288 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 11 + - 3489.34 + - - - 5888 + - 256 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 1044.49 + - - - 448 + - 2944 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 2911.28 + - - - 4 + - 6784 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 97.5212 + - - - 128 + - 704 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 639.376 + - - - 256 + - 2944 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 12 + - 2602.85 + - - - 256 + - 128 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 534.988 + - - - 4 + - 704 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 27 + - 13.1743 + - - - 448 + - 6784 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 13 + - 3359.6 + - - - 1024 + - 1024 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 12 + - 
2427.02 + - - - 2368 + - 5888 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 2166.5 + - - - 1408 + - 3584 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 3192.58 + - - - 1856 + - 64 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 3 + - 145.413 + - - - 4 + - 704 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 30 + - 35.0176 + - - - 128 + - 704 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 998.767 + - - - 128 + - 4 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 27 + - 20.2464 + - - - 128 + - 1856 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 22 + - 2233.92 + - - - 1408 + - 1408 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 20 + - 2886.11 + - - - 4288 + - 2944 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 11 + - 3791.37 + - - - 5056 + - 1408 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 1987.81 + - - - 6784 + - 3584 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 4079.08 + - - - 3584 + - 448 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 3323.76 + - - - 128 + - 2944 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 2139.32 + - - - 1408 + - 448 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 8 + - 2447.1 + - - - 448 + - 5056 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2941.67 + - - - 256 + - 448 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 18 + - 756.704 + - - - 1024 + - 1408 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 937.37 + - - - 5056 + - 5056 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4177.95 + - - - 2944 + - 704 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 12 + - 2873.17 + - - - 4288 + - 128 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 8 + - 2099.84 + - - - 5888 + - 2944 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 11 + - 3976.61 + - - - 4288 + - 4 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 26 + - 151.063 + - - - 448 
+ - 1024 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 515.452 + - - - 4 + - 1408 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 24.2237 + - - - 128 + - 704 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 18 + - 905.838 + - - - 2944 + - 64 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 22 + - 1865.77 + - - - 448 + - 2368 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 8 + - 2550.54 + - - - 128 + - 1024 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 170.778 + - - - 5056 + - 704 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 17 + - 3184.28 + - - - 256 + - 4 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 27 + - 38.6205 + - - - 448 + - 1408 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 8 + - 2334.44 + - - - 3584 + - 2368 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 11 + - 3764.82 + - - - 2368 + - 1408 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 12 + - 3194.39 + - - - 1024 + - 704 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 12 + - 2523.29 + - - - 4 + - 1408 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 174.066 + - - - 1408 + - 2368 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1575.96 + - - - 1856 + - 2944 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 11 + - 3723.65 + - - - 3584 + - 2944 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 11 + - 3893.92 + - - - 4 + - 128 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 14.39 + - - - 256 + - 4288 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 2778.39 + - - - 448 + - 448 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 22 + - 1923.8 + - - - 3584 + - 1024 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 13 + - 4049.68 + - - - 2944 + - 1408 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 17 + - 3303.38 + - - - 1024 + - 4 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 30 + - 18.2046 + - - - 1024 + - 64 + - 1 + - 1792 + - 1024 + - 1024 + 
- 1792 + - 1792 + - - 5 + - 720.671 + - - - 4 + - 256 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 2.35404 + - - - 64 + - 5056 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 14 + - 2211.45 + - - - 704 + - 1024 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 8 + - 2139.95 + - - - 1024 + - 1408 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 17 + - 2988.92 + - - - 704 + - 1024 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 726.344 + - - - 4288 + - 128 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 548.864 + - - - 5056 + - 2368 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 17 + - 3815.7 + - - - 64 + - 2368 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 15 + - 1505.39 + - - - 1408 + - 704 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 8 + - 2359.49 + - - - 1856 + - 5888 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 13 + - 3979.44 + - - - 1408 + - 1024 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1059.17 + - - - 1024 + - 2944 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 13 + - 3405.1 + - - - 64 + - 4 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 23 + - 0.629192 + - - - 6784 + - 448 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 3422.91 + - - - 1408 + - 1856 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 11 + - 3285.08 + - - - 3584 + - 256 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 12 + - 3203.64 + - - - 5888 + - 1024 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 11 + - 3495.53 + - - - 1024 + - 448 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 474.162 + - - - 2368 + - 128 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 8 + - 1926.65 + - - - 1856 + - 64 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 18 + - 796.874 + - - - 128 + - 2368 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 1878.67 + - - - 64 + - 6784 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 8 + 
- 2248.16 + - - - 1024 + - 1024 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 8 + - 2559.45 + - - - 2368 + - 2944 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 13 + - 3923.01 + - - - 704 + - 2368 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1317.84 + - - - 1408 + - 5888 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 11 + - 3474.2 + - - - 1856 + - 2944 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 13 + - 3847.74 + - - - 4288 + - 704 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 1503.74 + - - - 6784 + - 704 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 3794.06 + - - - 2944 + - 1856 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 1832.43 + - - - 1024 + - 1024 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 732.95 + - - - 2368 + - 704 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 1245.25 + - - - 64 + - 64 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 88.9917 + - - - 128 + - 704 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 117.986 + - - - 5056 + - 5888 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4231.37 + - - - 704 + - 704 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 8 + - 1516.22 + - - - 4288 + - 2368 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 3812.62 + - - - 5888 + - 6784 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2176.35 + - - - 128 + - 448 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 436.907 + - - - 128 + - 5888 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 12 + - 2484.61 + - - - 64 + - 4288 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 319.107 + - - - 64 + - 6784 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 8 + - 1971.66 + - - - 64 + - 128 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 10.1922 + - - - 2944 + - 5888 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 17 + - 4037.68 + - - - 3584 + - 4 + - 1 + 
- 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 25 + - 63.0823 + - - - 4288 + - 2944 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 11 + - 4012.7 + - - - 4 + - 6784 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 62.1144 + - - - 704 + - 64 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 5 + - 956.291 + - - - 2944 + - 448 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 8 + - 2949.99 + - - - 704 + - 448 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 8 + - 1433.6 + - - - 5888 + - 5888 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 13 + - 4359.14 + - - - 1024 + - 448 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 8 + - 2980.96 + - - - 2944 + - 6784 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 11 + - 3775.0 + - - - 256 + - 64 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 18 + - 128.188 + - - - 4288 + - 256 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 8 + - 2585.42 + - - - 2944 + - 2944 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 17 + - 3962.38 + - - - 704 + - 704 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 6 + - 1908.51 + - - - 1856 + - 5056 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 17 + - 3907.43 + - - - 5888 + - 3584 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 11 + - 3816.24 + - - - 1024 + - 4 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 23 + - 9.72353 + - - - 1408 + - 3584 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 17 + - 3438.44 + - - - 448 + - 704 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 14 + - 2213.28 + - - - 64 + - 1856 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 151.801 + - - - 64 + - 5056 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 1336.09 + - - - 1856 + - 2944 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 11 + - 3415.04 + - - - 2944 + - 256 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 12 + - 2138.05 + - - - 128 + - 5056 + - 1 + - 3328 + - 128 + - 128 + - 
3328 + - 3328 + - - 6 + - 2501.83 + - - - 64 + - 256 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 20.5281 + - - - 704 + - 1408 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 2047.74 + - - - 2944 + - 448 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 12 + - 2954.17 + - - - 64 + - 6784 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 12 + - 1473.34 + - - - 4288 + - 704 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 13 + - 3179.73 + - - - 5888 + - 448 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 17 + - 3366.06 + - - - 5056 + - 1856 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 11 + - 3922.94 + - - - 4288 + - 448 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 2 + - 1388.9 + - - - 5888 + - 2368 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 17 + - 3823.0 + - - - 128 + - 256 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 257.635 + - - - 1856 + - 4 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 29 + - 32.3662 + - - - 2944 + - 1856 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 17 + - 3366.39 + - - - 4288 + - 6784 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 11 + - 3894.22 + - - - 2368 + - 704 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 17 + - 2788.62 + - - - 128 + - 2368 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 354.249 + - - - 4 + - 2368 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 29 + - 39.8297 + - - - 3584 + - 5888 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 2092.35 + - - - 3584 + - 1024 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1506.42 + - - - 4288 + - 3584 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2219.44 + - - - 2944 + - 1024 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 13 + - 3422.66 + - - - 1024 + - 5888 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 11 + - 3504.78 + - - - 5056 + - 1024 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 12 + - 3272.27 
+ - - - 1024 + - 128 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 773.857 + - - - 6784 + - 2944 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2134.34 + - - - 448 + - 4288 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1477.0 + - - - 256 + - 4288 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 2538.1 + - - - 6784 + - 64 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 8 + - 2831.43 + - - - 2368 + - 4 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 27 + - 103.448 + - - - 1856 + - 2368 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 3506.5 + - - - 3584 + - 4 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 24 + - 33.0516 + - - - 6784 + - 2368 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 17 + - 3872.85 + - - - 6784 + - 5056 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 4317.51 + - - - 704 + - 128 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 3 + - 113.259 + - - - 64 + - 3584 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 1675.81 + - - - 5056 + - 64 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 3 + - 370.339 + - - - 704 + - 256 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 1603.9 + - - - 4288 + - 704 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 3409.54 + - - - 128 + - 2944 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 2353.89 + - - - 3584 + - 1024 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 13 + - 4126.96 + - - - 448 + - 256 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 18 + - 1128.08 + - - - 1024 + - 2944 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 13 + - 3151.21 + - - - 4 + - 448 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 4.1554 + - - - 1024 + - 2368 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1177.11 + - - - 1856 + - 448 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 12 + - 2744.0 + - - - 1856 + - 64 + - 1 + - 1792 + - 
1856 + - 1856 + - 1792 + - 1792 + - - 18 + - 1240.45 + - - - 6784 + - 1408 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 3988.18 + - - - 128 + - 448 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 18 + - 592.575 + - - - 64 + - 704 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 936.229 + - - - 448 + - 256 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 147.746 + - - - 6784 + - 1408 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 11 + - 3927.59 + - - - 6784 + - 2368 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2118.63 + - - - 3584 + - 1408 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 12 + - 3197.0 + - - - 2944 + - 6784 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 2145.67 + - - - 1024 + - 1024 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 2131.79 + - - - 6784 + - 5888 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3928.5 + - - - 5056 + - 5056 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2232.84 + - - - 1856 + - 3584 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 11 + - 3779.49 + - - - 64 + - 4 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 29 + - 1.76172 + - - - 2944 + - 3584 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 11 + - 3660.47 + - - - 1856 + - 256 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 6 + - 3046.49 + - - - 5888 + - 4288 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 4119.06 + - - - 4288 + - 1408 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 1881.58 + - - - 4288 + - 6784 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 4146.25 + - - - 5888 + - 3584 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 17 + - 4030.37 + - - - 64 + - 1408 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 637.961 + - - - 704 + - 6784 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 13 + - 3358.39 + - - - 256 + - 704 + - 1 + - 1792 + - 256 + - 256 + - 
1792 + - 1792 + - - 6 + - 1541.43 + - - - 5056 + - 1408 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 13 + - 3460.48 + - - - 2944 + - 3584 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 2036.93 + - - - 5056 + - 5888 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4262.56 + - - - 704 + - 1856 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1031.38 + - - - 4 + - 3584 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 57.201 + - - - 1408 + - 64 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 5 + - 1052.4 + - - - 704 + - 5888 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1701.45 + - - - 1408 + - 1408 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 2590.4 + - - - 64 + - 1408 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 21 + - 922.536 + - - - 1024 + - 1408 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 12 + - 3301.59 + - - - 4288 + - 5056 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 4100.33 + - - - 4288 + - 1856 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 17 + - 3623.32 + - - - 1408 + - 5888 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 3778.27 + - - - 3584 + - 5888 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 4039.82 + - - - 448 + - 1856 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 845.223 + - - - 6784 + - 1856 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 17 + - 3951.52 + - - - 704 + - 1024 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 8 + - 2876.39 + - - - 5056 + - 448 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 1379.57 + - - - 704 + - 2944 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 3059.56 + - - - 2944 + - 1024 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 12 + - 2929.52 + - - - 5888 + - 3584 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 11 + - 3978.03 + - - - 2944 + - 2368 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 
128 + - - 0 + - 1856.26 + - - - 6784 + - 64 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 6 + - 1880.06 + - - - 2368 + - 704 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 17 + - 3227.24 + - - - 256 + - 5056 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 803.0 + - - - 6784 + - 256 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 1285.85 + - - - 1856 + - 704 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 12 + - 2663.18 + - - - 3584 + - 704 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 12 + - 2805.43 + - - - 6784 + - 1856 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 17 + - 3942.17 + - - - 3584 + - 448 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3272.93 + - - - 5888 + - 3584 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 11 + - 4032.36 + - - - 2944 + - 5056 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 13 + - 4245.62 + - - - 64 + - 1408 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 900.182 + - - - 64 + - 1856 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 782.117 + - - - 2368 + - 128 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 3 + - 360.57 + - - - 1856 + - 4288 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 17 + - 3643.87 + - - - 5056 + - 4 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 25 + - 100.828 + - - - 1024 + - 6784 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 17 + - 3329.81 + - - - 5056 + - 5888 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4150.24 + - - - 1408 + - 256 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 8 + - 2301.61 + - - - 448 + - 1024 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 2902.84 + - - - 2944 + - 1024 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 13 + - 3375.57 + - - - 1024 + - 2944 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1258.73 + - - - 2368 + - 6784 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 11 + 
- 3896.4 + - - - 5056 + - 3584 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4002.09 + - - - 1856 + - 1408 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 11 + - 3305.3 + - - - 4288 + - 2368 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2116.79 + - - - 704 + - 1408 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 8 + - 2392.71 + - - - 4288 + - 4 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 25 + - 107.984 + - - - 4 + - 4 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 30 + - 0.463648 + - - - 2944 + - 2368 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 13 + - 3959.24 + - - - 2368 + - 64 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 8 + - 1194.5 + - - - 704 + - 4 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 23 + - 6.76523 + - - - 128 + - 1856 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 1303.98 + - - - 2944 + - 1856 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 13 + - 3785.45 + - - - 704 + - 64 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 707.256 + - - - 64 + - 6784 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 486.472 + - - - 5888 + - 2944 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 11 + - 4023.13 + - - - 4 + - 4 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 30 + - 0.0973384 + - - - 2944 + - 64 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 18 + - 1563.73 + - - - 4288 + - 448 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 17 + - 3709.14 + - - - 5888 + - 5888 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 13 + - 3932.49 + - - - 1408 + - 6784 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 3976.21 + - - - 1024 + - 704 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 685.751 + - - - 5888 + - 704 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 12 + - 3279.23 + - - - 2368 + - 448 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 6 + - 2655.51 + - - - 1408 + - 64 + 
- 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 18 + - 636.553 + - - - 1024 + - 256 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 8 + - 1178.18 + - - - 5888 + - 3584 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2070.91 + - - - 2368 + - 6784 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 11 + - 3941.22 + - - - 1856 + - 256 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 8 + - 2747.77 + - - - 1408 + - 1024 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 8 + - 3155.77 + - - - 2944 + - 4 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 27 + - 194.818 + - - - 128 + - 2944 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 413.533 + - - - 5888 + - 704 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 1568.28 + - - - 448 + - 448 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 8 + - 1116.96 + - - - 4 + - 448 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 66.7989 + - - - 256 + - 1024 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 8 + - 1534.5 + - - - 3584 + - 5056 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 2067.54 + - - - 2944 + - 5056 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 13 + - 4078.28 + - - - 1024 + - 2944 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 2892.62 + - - - 1856 + - 448 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 12 + - 2911.61 + - - - 5056 + - 448 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 12 + - 2938.1 + - - - 3584 + - 3584 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 2006.85 + - - - 2368 + - 128 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 14 + - 2163.91 + - - - 4 + - 1024 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 9.60947 + - - - 5888 + - 128 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 12 + - 2134.27 + - - - 6784 + - 1856 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2043.18 + - - - 704 + - 64 + - 1 + - 128 + - 704 + - 704 + - 
128 + - 128 + - - 3 + - 56.4523 + - - - 2944 + - 448 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 984.263 + - - - 4288 + - 64 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 8 + - 1602.52 + - - - 448 + - 1408 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 635.951 + - - - 256 + - 3584 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 12 + - 2528.87 + - - - 704 + - 448 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 3 + - 379.134 + - - - 5888 + - 4288 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 17 + - 4081.74 + - - - 6784 + - 5888 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2254.19 + - - - 256 + - 1856 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 8 + - 2082.79 + - - - 2368 + - 704 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 17 + - 3376.66 + - - - 5056 + - 4 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 23 + - 46.2267 + - - - 5888 + - 448 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 12 + - 2936.01 + - - - 2368 + - 2368 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 11 + - 3427.0 + - - - 3584 + - 256 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 12 + - 3138.2 + - - - 1408 + - 1856 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 17 + - 3209.72 + - - - 2944 + - 128 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 8 + - 2207.19 + - - - 5056 + - 6784 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4363.07 + - - - 2368 + - 4 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 23 + - 21.8692 + - - - 5056 + - 256 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 12 + - 2882.31 + - - - 1856 + - 1024 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 11 + - 3292.77 + - - - 1408 + - 2944 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 3176.36 + - - - 1408 + - 1856 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 3334.09 + - - - 64 + - 3584 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 
264.41 + - - - 5888 + - 256 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 11 + - 2654.62 + - - - 704 + - 2368 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 11 + - 3424.87 + - - - 64 + - 3584 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 1248.3 + - - - 6784 + - 5056 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2197.39 + - - - 1408 + - 128 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 6 + - 1508.6 + - - - 4288 + - 2944 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2219.83 + - - - 2368 + - 4 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 27 + - 174.198 + - - - 2944 + - 5056 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 2086.36 + - - - 1024 + - 1856 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1165.53 + - - - 5056 + - 4288 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2220.47 + - - - 2944 + - 5888 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 11 + - 3805.55 + - - - 4288 + - 2368 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 17 + - 3504.4 + - - - 704 + - 1408 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 2501.25 + - - - 4288 + - 6784 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 13 + - 4079.5 + - - - 256 + - 704 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 1035.4 + - - - 64 + - 2368 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 187.681 + - - - 128 + - 4288 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 2087.01 + - - - 448 + - 64 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 36.2363 + - - - 1856 + - 4288 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 12 + - 3319.94 + - - - 4 + - 2368 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 30 + - 166.672 + - - - 5056 + - 448 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 12 + - 3134.62 + - - - 2944 + - 4288 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 17 + - 3705.41 + - - - 128 + - 256 + - 1 + - 
3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 703.742 + - - - 4288 + - 5888 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 4105.95 + - - - 1856 + - 128 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 8 + - 2001.32 + - - - 6784 + - 1408 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3694.22 + - - - 1408 + - 2368 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 13 + - 3515.8 + - - - 64 + - 6784 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 8 + - 2428.63 + - - - 64 + - 64 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 42.7874 + - - - 6784 + - 2368 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 17 + - 3699.64 + - - - 64 + - 5888 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 6 + - 1845.71 + - - - 128 + - 448 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 1135.42 + - - - 4288 + - 5888 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2285.9 + - - - 1024 + - 5056 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 17 + - 3528.76 + - - - 704 + - 4288 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 13 + - 3408.24 + - - - 4 + - 1856 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 17.1407 + - - - 4288 + - 6784 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 4169.2 + - - - 128 + - 6784 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 12 + - 3040.19 + - - - 6784 + - 256 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3033.54 + - - - 1408 + - 704 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 2046.41 + - - - 64 + - 2368 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 866.011 + - - - 1408 + - 6784 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 11 + - 3986.03 + - - - 64 + - 5888 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 6 + - 2076.01 + - - - 5056 + - 64 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 8 + - 1464.6 + - - - 2944 + - 5888 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 
+ - - 0 + - 2157.85 + - - - 4 + - 5056 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 46.2928 + - - - 2944 + - 1408 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 1610.94 + - - - 704 + - 4288 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 13 + - 3343.39 + - - - 6784 + - 4 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 25 + - 102.591 + - - - 1408 + - 448 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 4 + - 609.453 + - - - 2368 + - 5056 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 17 + - 3811.33 + - - - 1856 + - 4288 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 17 + - 3560.04 + - - - 4 + - 4288 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 29 + - 147.149 + - - - 6784 + - 5888 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 4089.07 + - - - 1024 + - 128 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 3 + - 162.444 + - - - 4 + - 4288 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 64.9543 + - - - 4 + - 128 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 20.0746 + - - - 4 + - 4288 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 30 + - 64.8543 + - - - 5888 + - 5056 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 4245.76 + - - - 4288 + - 1024 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 11 + - 3497.0 + - - - 3584 + - 64 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 18 + - 1692.55 + - - - 256 + - 2944 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 12 + - 2641.1 + - - - 6784 + - 5888 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 4127.14 + - - - 64 + - 5888 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 6 + - 1345.83 + - - - 1856 + - 5888 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 13 + - 3628.73 + - - - 704 + - 5056 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1729.98 + - - - 448 + - 256 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 16 + - 1548.03 + - - - 4 + - 5056 + - 1 + 
- 768 + - 4 + - 4 + - 768 + - 768 + - - 26 + - 165.235 + - - - 5056 + - 3584 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 11 + - 3772.45 + - - - 3584 + - 5888 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 4027.52 + - - - 64 + - 2944 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 225.648 + - - - 128 + - 5056 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 2436.81 + - - - 4 + - 3584 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 30 + - 80.5842 + - - - 64 + - 256 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 302.807 + - - - 5056 + - 2944 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4244.08 + - - - 1024 + - 448 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 8 + - 2586.04 + - - - 3584 + - 2368 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3858.79 + - - - 448 + - 5056 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 8 + - 3099.6 + - - - 1856 + - 3584 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 11 + - 3842.95 + - - - 5056 + - 1408 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4051.83 + - - - 128 + - 3584 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 489.662 + - - - 5056 + - 704 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 3726.34 + - - - 1024 + - 6784 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 13 + - 3848.18 + - - - 5888 + - 5056 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2161.14 + - - - 5888 + - 1024 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 12 + - 3256.34 + - - - 1408 + - 5056 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1867.24 + - - - 2944 + - 5056 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 13 + - 4198.68 + - - - 5888 + - 6784 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 13 + - 4150.84 + - - - 1856 + - 704 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 12 + - 2925.96 + - - - 64 + - 4 + - 1 + - 3328 + - 64 + 
- 64 + - 3328 + - 3328 + - - 27 + - 10.768 + - - - 704 + - 64 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 18 + - 471.688 + - - - 5056 + - 2944 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4204.34 + - - - 1856 + - 128 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 22 + - 2244.06 + - - - 5888 + - 2944 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 11 + - 3807.9 + - - - 5056 + - 1408 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 3861.29 + - - - 4 + - 5056 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 29 + - 73.8776 + - - - 3584 + - 6784 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 2122.21 + - - - 256 + - 1024 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 305.707 + - - - 2944 + - 4288 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 17 + - 4023.15 + - - - 704 + - 2944 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 8 + - 2922.98 + - - - 256 + - 5056 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 12 + - 2979.77 + - - - 1024 + - 5888 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 17 + - 3500.51 + - - - 3584 + - 4288 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 13 + - 4355.2 + - - - 64 + - 2944 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 18 + - 1551.09 + - - - 1024 + - 2368 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 12 + - 3211.89 + - - - 1408 + - 6784 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 11 + - 3683.98 + - - - 2368 + - 2944 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 13 + - 3399.64 + - - - 6784 + - 128 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 12 + - 2992.47 + - - - 3584 + - 256 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 4 + - 858.483 + - - - 3584 + - 3584 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 3862.76 + - - - 4 + - 1024 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 133.433 + - - - 448 + - 4 + - 1 + - 128 + - 448 + - 448 + - 128 + - 
128 + - - 23 + - 4.40434 + - - - 4288 + - 3584 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 4388.11 + - - - 4 + - 4 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 0.0353594 + - - - 5056 + - 1408 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4005.99 + - - - 64 + - 128 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 10 + - 258.172 + - - - 4 + - 64 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 7.7179 + - - - 1024 + - 1856 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 17 + - 3703.86 + - - - 5056 + - 64 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 8 + - 1890.69 + - - - 3584 + - 2944 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3632.51 + - - - 2368 + - 1408 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 13 + - 3559.59 + - - - 64 + - 256 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 171.898 + - - - 5056 + - 64 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 20 + - 2258.95 + - - - 448 + - 3584 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 11 + - 3321.78 + - - - 2944 + - 2368 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 13 + - 3770.87 + - - - 2944 + - 3584 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 13 + - 3972.92 + - - - 2944 + - 704 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 12 + - 2693.84 + - - - 1856 + - 2368 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 12 + - 3462.63 + - - - 64 + - 448 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 224.878 + - - - 2368 + - 2944 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 13 + - 3970.57 + - - - 4288 + - 1024 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 11 + - 3516.93 + - - - 2368 + - 256 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 8 + - 2341.62 + - - - 2368 + - 2368 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 17 + - 3871.12 + - - - 448 + - 4 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 27 + - 24.7885 
+ - - - 1024 + - 5888 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 3240.48 + - - - 6784 + - 64 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 3 + - 503.392 + - - - 256 + - 5888 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 17 + - 3087.43 + - - - 3584 + - 6784 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 4030.55 + - - - 1024 + - 5056 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 17 + - 3615.11 + - - - 256 + - 256 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 18 + - 488.847 + - - - 1856 + - 1408 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 11 + - 3222.09 + - - - 5056 + - 2368 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2110.41 + - - - 6784 + - 5888 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 4164.62 + - - - 3584 + - 704 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3196.19 + - - - 1856 + - 1856 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 13 + - 3616.52 + - - - 256 + - 704 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 22 + - 1780.41 + - - - 64 + - 448 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 692.657 + - - - 1024 + - 4 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 27 + - 131.477 + - - - 3584 + - 1856 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 3736.59 + - - - 3584 + - 128 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 8 + - 2997.81 + - - - 5888 + - 128 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 12 + - 2598.84 + - - - 4288 + - 64 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 8 + - 1267.22 + - - - 5056 + - 4 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 25 + - 78.2549 + - - - 64 + - 4288 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 8 + - 1704.74 + - - - 5888 + - 1856 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 17 + - 3567.28 + - - - 64 + - 448 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 38.3893 + - - - 3584 + - 
3584 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 3800.43 + - - - 2944 + - 4288 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 2033.86 + - - - 6784 + - 4288 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 4027.08 + - - - 1408 + - 128 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 1028.02 + - - - 4288 + - 128 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 8 + - 1960.23 + - - - 704 + - 704 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 8 + - 1833.49 + - - - 4288 + - 1408 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 12 + - 3270.14 + - - - 2944 + - 5888 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 11 + - 3992.16 + - - - 128 + - 1024 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 1121.04 + - - - 5888 + - 1856 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 13 + - 4068.92 + - - - 2368 + - 256 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 8 + - 1838.74 + - - - 256 + - 256 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 81.984 + - - - 1408 + - 256 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 20 + - 2415.76 + - - - 6784 + - 4288 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2209.21 + - - - 2944 + - 128 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 8 + - 2469.08 + - - - 256 + - 6784 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 17 + - 3599.03 + - - - 1024 + - 4288 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1517.71 + - - - 256 + - 448 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 18 + - 1286.44 + - - - 4 + - 704 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 67.1761 + - - - 6784 + - 704 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 1665.91 + - - - 6784 + - 448 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 3363.58 + - - - 1024 + - 128 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 6 + - 1056.5 + - - - 1408 + - 4 + - 1 + - 3328 + - 
1408 + - 1408 + - 3328 + - 3328 + - - 27 + - 179.123 + - - - 1024 + - 64 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 3 + - 82.7605 + - - - 704 + - 1856 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 8 + - 2947.22 + - - - 1024 + - 4 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 30 + - 48.0117 + - - - 704 + - 448 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 2007.04 + - - - 1024 + - 704 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 2036.07 + - - - 2368 + - 2368 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 1979.68 + - - - 1024 + - 5056 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1562.97 + - - - 2944 + - 3584 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 11 + - 3902.17 + - - - 1408 + - 2944 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 3292.32 + - - - 64 + - 1024 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 496.955 + - - - 128 + - 5056 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 2266.62 + - - - 4288 + - 128 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 8 + - 1658.51 + - - - 5056 + - 1856 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 11 + - 3833.44 + - - - 2368 + - 1856 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 12 + - 3350.97 + - - - 2368 + - 1024 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 6 + - 3223.71 + - - - 1856 + - 448 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 12 + - 2382.06 + - - - 4288 + - 6784 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2287.61 + - - - 256 + - 1856 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 505.464 + - - - 256 + - 256 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 16 + - 1030.35 + - - - 128 + - 4288 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 1943.6 + - - - 1024 + - 2368 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 3098.83 + - - - 4 + - 64 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 
+ - 4.28153 + - - - 2944 + - 2944 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 11 + - 3874.66 + - - - 1856 + - 1856 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1674.75 + - - - 64 + - 2944 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 1396.75 + - - - 448 + - 4288 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 11 + - 3691.32 + - - - 5888 + - 704 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 11 + - 3302.66 + - - - 3584 + - 2944 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1945.39 + - - - 6784 + - 3584 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3866.25 + - - - 1024 + - 6784 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1645.92 + - - - 1408 + - 5056 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 13 + - 3826.91 + - - - 64 + - 704 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 55.0723 + - - - 1024 + - 704 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 6 + - 2545.27 + - - - 128 + - 1408 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 1425.17 + - - - 2368 + - 3584 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 11 + - 3861.69 + - - - 64 + - 2944 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 15 + - 1807.68 + - - - 4 + - 448 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 46.0859 + - - - 448 + - 1024 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 8 + - 2019.27 + - - - 4288 + - 1856 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 11 + - 3540.4 + - - - 2944 + - 2368 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 13 + - 3904.76 + - - - 3584 + - 1408 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3497.09 + - - - 2944 + - 256 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 755.553 + - - - 704 + - 6784 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1932.6 + - - - 1856 + - 6784 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 11 + - 4008.71 + - - - 5888 + - 
5888 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2192.74 + - - - 3584 + - 4288 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 13 + - 4142.02 + - - - 1024 + - 448 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 6 + - 1965.2 + - - - 2368 + - 4288 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 13 + - 3857.27 + - - - 128 + - 4288 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 1638.4 + - - - 4288 + - 704 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 3348.03 + - - - 1856 + - 1024 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 11 + - 3878.66 + - - - 256 + - 448 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 19 + - 1519.92 + - - - 64 + - 2944 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 18 + - 1057.77 + - - - 64 + - 1856 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 19 + - 1518.57 + - - - 64 + - 3584 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 15 + - 2147.66 + - - - 1408 + - 5056 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 3354.98 + - - - 128 + - 6784 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 12 + - 2845.11 + - - - 4288 + - 256 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 834.774 + - - - 2368 + - 1408 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 1625.92 + - - - 448 + - 4 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 27 + - 64.6553 + - - - 704 + - 704 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 486.494 + - - - 5888 + - 4 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 28 + - 86.9278 + - - - 4 + - 256 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 30 + - 5.67903 + - - - 5888 + - 5056 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 13 + - 4203.84 + - - - 256 + - 2368 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 6 + - 2165.03 + - - - 4288 + - 3584 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 4348.15 + - - - 128 + - 2944 + - 1 + - 3328 + - 128 + - 128 + 
- 3328 + - 3328 + - - 6 + - 2425.53 + - - - 3584 + - 4 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 27 + - 134.927 + - - - 1856 + - 1408 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 3341.36 + - - - 256 + - 128 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 18 + - 256.376 + - - - 256 + - 5056 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 12 + - 2614.82 + - - - 5888 + - 256 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 17 + - 3119.18 + - - - 5888 + - 4 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 26 + - 183.373 + - - - 2944 + - 128 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 3 + - 451.972 + - - - 4288 + - 5056 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2224.03 + - - - 6784 + - 704 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 17 + - 3708.87 + - - - 1856 + - 5888 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 13 + - 4156.02 + - - - 5888 + - 448 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 17 + - 3250.3 + - - - 1408 + - 5888 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1957.86 + - - - 448 + - 4288 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 11 + - 3867.95 + - - - 64 + - 1024 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 745.559 + - - - 704 + - 1856 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 8 + - 2897.86 + - - - 2944 + - 6784 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 17 + - 3982.55 + - - - 448 + - 6784 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1508.3 + - - - 448 + - 5056 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 3051.36 + - - - 2944 + - 448 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 12 + - 2684.81 + - - - 256 + - 5056 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 2903.45 + - - - 256 + - 1024 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 1737.05 + - - - 1024 + - 64 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 
18 + - 682.37 + - - - 448 + - 4288 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 11 + - 3188.42 + - - - 3584 + - 64 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 18 + - 1261.17 + - - - 5056 + - 5056 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4050.28 + - - - 4288 + - 1024 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 11 + - 3420.66 + - - - 4 + - 1408 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 12.4122 + - - - 128 + - 2368 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 1358.45 + - - - 5056 + - 1024 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 3646.2 + - - - 2368 + - 448 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 8 + - 2643.9 + - - - 448 + - 704 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 6 + - 1433.6 + - - - 5888 + - 448 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 2 + - 1265.9 + - - - 448 + - 5056 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 12 + - 3044.65 + - - - 2368 + - 3584 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 11 + - 3808.28 + - - - 256 + - 1408 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 8 + - 2378.22 + - - - 6784 + - 2944 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 3981.55 + - - - 256 + - 2368 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 22 + - 2396.49 + - - - 1856 + - 256 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 8 + - 2102.95 + - - - 448 + - 3584 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1277.48 + - - - 4288 + - 256 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 7 + - 2826.19 + - - - 1024 + - 1024 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 6 + - 2384.26 + - - - 1024 + - 3584 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 17 + - 3302.6 + - - - 256 + - 3584 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 774.674 + - - - 6784 + - 4 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 26 + - 66.9749 + - - - 704 + - 2944 
+ - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 2691.66 + - - - 2368 + - 5888 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 11 + - 3638.34 + - - - 1408 + - 4288 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 11 + - 3490.16 + - - - 2368 + - 704 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 17 + - 3438.97 + - - - 448 + - 2944 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2674.6 + - - - 3584 + - 1024 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 13 + - 3831.25 + - - - 4288 + - 1024 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 12 + - 3338.3 + - - - 256 + - 128 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 711.084 + - - - 6784 + - 6784 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 4391.67 + - - - 4288 + - 4288 + - 1 + - 128 + - 4288 + - 4288 + - 128 + - 128 + - - 0 + - 2232.95 + - - - 2368 + - 128 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 8 + - 1757.12 + - - - 4 + - 1856 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 146.777 + - - - 2368 + - 4288 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 2101.73 + - - - 4 + - 6784 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 30 + - 70.3341 + - - - 256 + - 3584 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 12 + - 3158.95 + - - - 704 + - 1856 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 2648.0 + - - - 128 + - 128 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 126.334 + - - - 1024 + - 1408 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 12 + - 2816.69 + - - - 5888 + - 64 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 3 + - 449.278 + - - - 256 + - 1024 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 8 + - 1680.12 + - - - 5888 + - 1408 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 11 + - 3788.44 + - - - 5888 + - 1856 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 1951.45 + - - - 704 + - 128 + - 1 + - 256 + - 704 + - 
704 + - 256 + - 256 + - - 18 + - 629.604 + - - - 3584 + - 128 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 3 + - 506.558 + - - - 5056 + - 128 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 650.42 + - - - 2944 + - 2944 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 2027.7 + - - - 1856 + - 1408 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1610.01 + - - - 64 + - 4288 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 8 + - 1534.39 + - - - 2944 + - 5056 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 17 + - 3655.81 + - - - 2368 + - 256 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 608.872 + - - - 4288 + - 448 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 17 + - 3941.92 + - - - 128 + - 64 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 18 + - 63.3198 + - - - 128 + - 1408 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 22 + - 1777.04 + - - - 1856 + - 6784 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 2231.48 + - - - 4 + - 4288 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 30 + - 80.7835 + - - - 2368 + - 5888 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 13 + - 3949.4 + - - - 6784 + - 64 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 6 + - 2472.18 + - - - 3584 + - 5056 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 13 + - 4056.65 + - - - 1856 + - 448 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 814.685 + - - - 4288 + - 2368 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 11 + - 3735.52 + - - - 2944 + - 128 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 8 + - 1681.82 + - - - 6784 + - 6784 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 4266.96 + - - - 1856 + - 1856 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 13 + - 3813.49 + - - - 1408 + - 4 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 23 + - 13.213 + - - - 1024 + - 4288 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 
12 + - 3308.43 + - - - 5056 + - 3584 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2238.34 + - - - 5056 + - 2368 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 11 + - 3751.09 + - - - 448 + - 3584 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 11 + - 3156.68 + - - - 2944 + - 64 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 6 + - 1076.66 + - - - 4 + - 256 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 27.7695 + - - - 2368 + - 256 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 8 + - 2183.71 + - - - 3584 + - 5888 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 3981.7 + - - - 256 + - 5888 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 11 + - 2973.77 + - - - 5888 + - 1408 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 11 + - 3721.45 + - - - 1024 + - 2368 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 17 + - 3106.56 + - - - 256 + - 448 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 146.449 + - - - 128 + - 6784 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 0 + - 773.157 + - - - 3584 + - 4288 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 17 + - 3759.52 + - - - 5056 + - 4 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 27 + - 167.95 + - - - 2368 + - 5056 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 17 + - 3745.47 + - - - 5056 + - 2944 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2170.2 + - - - 2368 + - 448 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 844.469 + - - - 128 + - 5888 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 12 + - 2113.69 + - - - 448 + - 64 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 18 + - 303.14 + - - - 256 + - 5888 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 17 + - 3129.61 + - - - 4 + - 1856 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 30 + - 205.209 + - - - 2368 + - 5056 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 2121.4 + - - - 448 + - 1408 + - 1 + - 
1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 2471.5 + - - - 5056 + - 128 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 9 + - 2525.06 + - - - 5888 + - 6784 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 13 + - 4106.76 + - - - 4288 + - 64 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 20 + - 1995.87 + - - - 448 + - 1024 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 8 + - 3007.74 + - - - 4 + - 448 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 27 + - 9.30909 + - - - 5888 + - 2368 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2023.26 + - - - 5888 + - 704 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 12 + - 3174.08 + - - - 4 + - 256 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 + - 14.9171 + - - - 1856 + - 1024 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1435.05 + - - - 6784 + - 4288 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 17 + - 3869.61 + - - - 704 + - 4288 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 2933.5 + - - - 128 + - 2368 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 20 + - 2101.52 + - - - 448 + - 1856 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 12 + - 2379.93 + - - - 5888 + - 64 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 8 + - 2393.26 + - - - 1024 + - 64 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 5 + - 967.458 + - - - 4288 + - 5056 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 13 + - 4033.91 + - - - 128 + - 5888 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 12 + - 2641.32 + - - - 256 + - 256 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 18 + - 766.984 + - - - 1856 + - 1408 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 12 + - 2918.81 + - - - 5056 + - 6784 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 1 + - 2324.24 + - - - 1856 + - 128 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 3 + - 286.011 + - - - 256 + - 64 + - 1 + - 128 + - 256 + - 256 + - 128 + - 
128 + - - 3 + - 20.7228 + - - - 6784 + - 128 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 12 + - 2854.86 + - - - 256 + - 2368 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 6 + - 1786.25 + - - - 2368 + - 6784 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 11 + - 3917.33 + - - - 64 + - 1408 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 117.505 + - - - 5056 + - 1856 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 17 + - 3590.65 + - - - 4 + - 128 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 29 + - 3.25726 + - - - 1856 + - 1856 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 13 + - 3886.13 + - - - 448 + - 128 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 70.6316 + - - - 64 + - 4288 + - 1 + - 256 + - 64 + - 64 + - 256 + - 256 + - - 6 + - 1149.45 + - - - 128 + - 256 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 18 + - 351.871 + - - - 64 + - 128 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 165.914 + - - - 2944 + - 128 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 8 + - 2400.07 + - - - 4 + - 64 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 10.5861 + - - - 704 + - 3584 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 2819.15 + - - - 1408 + - 5888 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 11 + - 3776.06 + - - - 6784 + - 1024 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 3796.29 + - - - 5056 + - 1024 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 1847.4 + - - - 6784 + - 4288 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 4118.83 + - - - 448 + - 3584 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 11 + - 3281.29 + - - - 1856 + - 64 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 16 + - 1638.94 + - - - 3584 + - 1408 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 13 + - 3547.47 + - - - 5056 + - 2944 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 13 + - 3719.76 + - - - 2944 
+ - 4 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 26 + - 212.438 + - - - 128 + - 1856 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 1942.87 + - - - 1856 + - 448 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 12 + - 2875.17 + - - - 5888 + - 128 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 12 + - 2476.1 + - - - 5888 + - 1024 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 17 + - 3432.86 + - - - 3584 + - 2944 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3954.77 + - - - 128 + - 5056 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 1905.19 + - - - 256 + - 5888 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 17 + - 2644.44 + - - - 6784 + - 2368 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 17 + - 3882.47 + - - - 4288 + - 3584 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 13 + - 4244.5 + - - - 128 + - 1024 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 5 + - 1398.46 + - - - 448 + - 4 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 27 + - 9.40066 + - - - 5056 + - 128 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 6 + - 1887.82 + - - - 4 + - 5888 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 82.2777 + - - - 448 + - 2368 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 8 + - 2746.92 + - - - 256 + - 704 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 8 + - 1427.52 + - - - 1856 + - 2368 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 17 + - 3481.2 + - - - 256 + - 64 + - 1 + - 3328 + - 256 + - 256 + - 3328 + - 3328 + - - 5 + - 456.513 + - - - 1408 + - 448 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 8 + - 2289.42 + - - - 4 + - 2368 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 26 + - 205.978 + - - - 6784 + - 3584 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 17 + - 4021.59 + - - - 64 + - 64 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 10 + - 139.438 + - - - 3584 + - 256 + - 1 + - 256 + - 3584 + - 3584 + 
- 256 + - 256 + - - 12 + - 2577.71 + - - - 704 + - 64 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 18 + - 344.103 + - - - 3584 + - 448 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1121.35 + - - - 1856 + - 704 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1018.31 + - - - 128 + - 3584 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 2590.6 + - - - 704 + - 4 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 27 + - 95.7072 + - - - 5056 + - 4288 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 13 + - 4135.36 + - - - 4 + - 64 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 0.571274 + - - - 2368 + - 448 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 8 + - 2503.51 + - - - 704 + - 3584 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1544.97 + - - - 1408 + - 1856 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 2902.6 + - - - 4 + - 2944 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 26 + - 47.7607 + - - - 1024 + - 4288 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 12 + - 3441.89 + - - - 448 + - 4288 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 11 + - 3956.37 + - - - 704 + - 128 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 5 + - 1021.51 + - - - 3584 + - 704 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 3095.87 + - - - 256 + - 64 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 18 + - 171.336 + - - - 704 + - 6784 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 11 + - 3707.07 + - - - 5056 + - 4288 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4001.41 + - - - 2368 + - 3584 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 17 + - 3788.23 + - - - 5056 + - 2368 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 11 + - 3830.18 + - - - 2944 + - 4 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 30 + - 119.503 + - - - 128 + - 256 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 517.998 + - - - 5056 
+ - 3584 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4108.88 + - - - 704 + - 6784 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 11 + - 3783.06 + - - - 704 + - 4 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 27 + - 13.7786 + - - - 128 + - 2944 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 1627.34 + - - - 256 + - 6784 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 11 + - 3396.28 + - - - 3584 + - 704 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 3228.52 + - - - 2944 + - 4 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 29 + - 49.9777 + - - - 64 + - 256 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 5 + - 436.068 + - - - 1024 + - 2368 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 12 + - 3324.06 + - - - 256 + - 1856 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 8 + - 3001.42 + - - - 2368 + - 4288 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 13 + - 3816.46 + - - - 704 + - 128 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 18 + - 917.365 + - - - 6784 + - 2368 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 3941.26 + - - - 704 + - 1408 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 818.777 + - - - 5056 + - 256 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 12 + - 3009.58 + - - - 5888 + - 5056 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 17 + - 3860.72 + - - - 4 + - 1856 + - 1 + - 256 + - 4 + - 4 + - 256 + - 256 + - - 29 + - 31.5077 + - - - 5888 + - 4288 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 17 + - 4031.31 + - - - 4 + - 2944 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 26 + - 113.732 + - - - 1856 + - 3584 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 2014.59 + - - - 64 + - 1856 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 1108.19 + - - - 2368 + - 2944 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 1952.09 + - - - 5056 + - 1856 + - 1 + - 1792 + - 5056 + - 
5056 + - 1792 + - 1792 + - - 17 + - 3910.92 + - - - 1408 + - 448 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 6 + - 1845.07 + - - - 4288 + - 128 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 7 + - 2448.55 + - - - 1856 + - 2368 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 12 + - 3341.42 + - - - 5056 + - 5056 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4142.27 + - - - 3584 + - 448 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 17 + - 3137.4 + - - - 448 + - 448 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 244.388 + - - - 256 + - 4 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 30 + - 5.82025 + - - - 256 + - 1856 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 8 + - 2710.22 + - - - 1408 + - 3584 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 13 + - 3512.42 + - - - 4 + - 5056 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 80.0529 + - - - 256 + - 4288 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 12 + - 2234.56 + - - - 64 + - 448 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 466.076 + - - - 3584 + - 4 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 26 + - 58.8144 + - - - 64 + - 5888 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 416.965 + - - - 1408 + - 1408 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1181.8 + - - - 4288 + - 256 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 8 + - 2720.64 + - - - 6784 + - 3584 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 17 + - 4055.35 + - - - 3584 + - 64 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 3 + - 271.25 + - - - 1408 + - 1408 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 8 + - 2899.21 + - - - 1408 + - 1408 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 8 + - 2771.47 + - - - 64 + - 1856 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 18 + - 1191.56 + - - - 448 + - 64 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 
715.94 + - - - 128 + - 64 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 5 + - 172.14 + - - - 6784 + - 5056 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 4358.37 + - - - 704 + - 3584 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 8 + - 3103.29 + - - - 448 + - 2944 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 12 + - 2944.55 + - - - 1408 + - 256 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 8 + - 1622.27 + - - - 448 + - 1856 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 12 + - 2914.06 + - - - 3584 + - 1408 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1567.47 + - - - 1856 + - 4 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 23 + - 17.0914 + - - - 4 + - 128 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 24 + - 1.15381 + - - - 128 + - 64 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 10 + - 273.067 + - - - 4 + - 5056 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 30 + - 68.6962 + - - - 128 + - 1408 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 6 + - 1509.17 + - - - 2944 + - 2944 + - 1 + - 1792 + - 2944 + - 2944 + - 1792 + - 1792 + - - 17 + - 3943.29 + - - - 4 + - 1856 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 + - 79.8101 + - - - 256 + - 4 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 23 + - 2.54018 + - - - 6784 + - 1024 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 1865.86 + - - - 3584 + - 64 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 22 + - 2028.93 + - - - 128 + - 3584 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 6 + - 2936.92 + - - - 5888 + - 256 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 11 + - 3080.95 + - - - 448 + - 1856 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 12 + - 2866.32 + - - - 448 + - 256 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 18 + - 752.052 + - - - 4288 + - 4288 + - 1 + - 768 + - 4288 + - 4288 + - 768 + - 768 + - - 13 + - 4067.72 + - - - 256 + - 6784 + - 1 + - 1792 
+ - 256 + - 256 + - 1792 + - 1792 + - - 17 + - 3547.2 + - - - 4288 + - 4288 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 13 + - 4149.76 + - - - 4 + - 704 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 97.0557 + - - - 6784 + - 1856 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 17 + - 4013.96 + - - - 1856 + - 5056 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 17 + - 3845.39 + - - - 5056 + - 128 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 8 + - 2299.34 + - - - 1408 + - 1856 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 1554.93 + - - - 1856 + - 3584 + - 1 + - 256 + - 1856 + - 1856 + - 256 + - 256 + - - 11 + - 3492.96 + - - - 6784 + - 5056 + - 1 + - 768 + - 6784 + - 6784 + - 768 + - 768 + - - 13 + - 4235.92 + - - - 128 + - 4 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 29 + - 3.25726 + - - - 704 + - 2368 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 17 + - 3220.1 + - - - 704 + - 2944 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 0 + - 1285.32 + - - - 1024 + - 256 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 3 + - 303.276 + - - - 5056 + - 5056 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 17 + - 3770.72 + - - - 4288 + - 1408 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 11 + - 3517.65 + - - - 1024 + - 64 + - 1 + - 256 + - 1024 + - 1024 + - 256 + - 256 + - - 18 + - 480.998 + - - - 2368 + - 1408 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 13 + - 3782.09 + - - - 5056 + - 128 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 8 + - 2456.63 + - - - 128 + - 448 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 70.7951 + - - - 128 + - 6784 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 12 + - 2414.18 + - - - 4 + - 1408 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 120.494 + - - - 2368 + - 1024 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 0 + - 1491.06 + - - - 4288 + - 64 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + 
- 1792 + - - 8 + - 1757.37 + - - - 2944 + - 256 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 12 + - 2475.26 + - - - 2944 + - 704 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 1238.75 + - - - 256 + - 3584 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 12 + - 3001.04 + - - - 5056 + - 448 + - 1 + - 3328 + - 5056 + - 5056 + - 3328 + - 3328 + - - 8 + - 3075.92 + - - - 5888 + - 4288 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 0 + - 2107.82 + - - - 5056 + - 6784 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 13 + - 3953.88 + - - - 1024 + - 448 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 8 + - 2864.0 + - - - 4 + - 5888 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 69.9434 + - - - 3584 + - 3584 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 17 + - 3843.46 + - - - 6784 + - 4 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 28 + - 100.041 + - - - 2944 + - 64 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 18 + - 1409.82 + - - - 256 + - 4288 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 8 + - 2708.35 + - - - 448 + - 2368 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 8 + - 2683.31 + - - - 256 + - 4 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 27 + - 15.2409 + - - - 448 + - 3584 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 11 + - 2821.54 + - - - 448 + - 1024 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 8 + - 2659.43 + - - - 5888 + - 1856 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 13 + - 3926.72 + - - - 1408 + - 4 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 27 + - 124.17 + - - - 448 + - 2944 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1033.93 + - - - 64 + - 5056 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 8 + - 1704.94 + - - - 6784 + - 128 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 4 + - 771.012 + - - - 1024 + - 1856 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 17 + - 3913.99 + - - - 
1856 + - 4 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 27 + - 152.287 + - - - 128 + - 1024 + - 1 + - 256 + - 128 + - 128 + - 256 + - 256 + - - 6 + - 773.857 + - - - 6784 + - 1024 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 3955.21 + - - - 1024 + - 3584 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 13 + - 3754.09 + - - - 1024 + - 256 + - 1 + - 768 + - 1024 + - 1024 + - 768 + - 768 + - - 8 + - 1531.7 + - - - 4288 + - 1856 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 12 + - 3329.06 + - - - 6784 + - 256 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 11 + - 3550.12 + - - - 1024 + - 704 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 6 + - 2693.14 + - - - 704 + - 6784 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 11 + - 3347.13 + - - - 2368 + - 1408 + - 1 + - 1792 + - 2368 + - 2368 + - 1792 + - 1792 + - - 13 + - 3728.09 + - - - 2944 + - 1024 + - 1 + - 128 + - 2944 + - 2944 + - 128 + - 128 + - - 0 + - 1428.33 + - - - 4288 + - 448 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 17 + - 3218.47 + - - - 1024 + - 2944 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 13 + - 3339.02 + - - - 128 + - 4 + - 1 + - 1792 + - 128 + - 128 + - 1792 + - 1792 + - - 27 + - 14.4808 + - - - 64 + - 5888 + - 1 + - 3328 + - 64 + - 64 + - 3328 + - 3328 + - - 6 + - 2227.37 + - - - 1408 + - 64 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 16 + - 1406.1 + - - - 256 + - 128 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 40.5796 + - - - 2944 + - 1408 + - 1 + - 256 + - 2944 + - 2944 + - 256 + - 256 + - - 12 + - 3175.6 + - - - 1408 + - 3584 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 13 + - 3560.83 + - - - 1408 + - 64 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 18 + - 909.648 + - - - 1856 + - 256 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 8 + - 3011.61 + - - - 5888 + - 6784 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 17 + - 3932.12 + - - - 3584 + - 
1856 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 17 + - 3873.56 + - - - 5056 + - 256 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 12 + - 2982.83 + - - - 448 + - 128 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 5 + - 803.821 + - - - 2368 + - 4288 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 17 + - 3745.13 + - - - 1856 + - 5888 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 2112.74 + - - - 3584 + - 128 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 8 + - 2000.01 + - - - 4 + - 4 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 30 + - 0.255574 + - - - 1408 + - 2368 + - 1 + - 256 + - 1408 + - 1408 + - 256 + - 256 + - - 12 + - 3201.1 + - - - 4288 + - 4 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 29 + - 65.3711 + - - - 4 + - 4 + - 1 + - 3328 + - 4 + - 4 + - 3328 + - 3328 + - - 27 + - 0.646846 + - - - 256 + - 1408 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 8 + - 2297.68 + - - - 256 + - 64 + - 1 + - 1792 + - 256 + - 256 + - 1792 + - 1792 + - - 5 + - 318.855 + - - - 1408 + - 256 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 8 + - 2095.88 + - - - 1856 + - 64 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 18 + - 1144.91 + - - - 128 + - 1856 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 1784.55 + - - - 704 + - 256 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 8 + - 1028.02 + - - - 3584 + - 5888 + - 1 + - 256 + - 3584 + - 3584 + - 256 + - 256 + - - 11 + - 3796.07 + - - - 256 + - 1408 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 8 + - 2121.58 + - - - 1856 + - 4288 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 17 + - 3622.0 + - - - 256 + - 2944 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 12 + - 2469.34 + - - - 1856 + - 704 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 6 + - 2857.36 + - - - 448 + - 5888 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 11 + - 3337.89 + - - - 64 + - 4288 + - 1 + - 3328 + - 64 + - 64 + - 
3328 + - 3328 + - - 14 + - 1916.79 + - - - 448 + - 6784 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 13 + - 3429.41 + - - - 5888 + - 2944 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 17 + - 4037.31 + - - - 704 + - 5888 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 12 + - 3163.48 + - - - 5888 + - 2368 + - 1 + - 1792 + - 5888 + - 5888 + - 1792 + - 1792 + - - 13 + - 3922.22 + - - - 4 + - 5888 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 29 + - 180.735 + - - - 2368 + - 64 + - 1 + - 128 + - 2368 + - 2368 + - 128 + - 128 + - - 3 + - 183.006 + - - - 64 + - 128 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 5 + - 88.8624 + - - - 1856 + - 1024 + - 1 + - 3328 + - 1856 + - 1856 + - 3328 + - 3328 + - - 11 + - 3927.6 + - - - 1408 + - 4288 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 17 + - 3437.32 + - - - 2368 + - 256 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 14 + - 2652.88 + - - - 256 + - 6784 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 1206.57 + - - - 5888 + - 64 + - 1 + - 768 + - 5888 + - 5888 + - 768 + - 768 + - - 8 + - 2166.22 + - - - 704 + - 256 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 22 + - 1771.58 + - - - 128 + - 1408 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 217.958 + - - - 5888 + - 4288 + - 1 + - 256 + - 5888 + - 5888 + - 256 + - 256 + - - 17 + - 3883.9 + - - - 1856 + - 5888 + - 1 + - 1792 + - 1856 + - 1856 + - 1792 + - 1792 + - - 13 + - 4110.25 + - - - 1408 + - 2944 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 12 + - 3259.36 + - - - 6784 + - 6784 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2246.59 + - - - 448 + - 5056 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 1412.92 + - - - 448 + - 2368 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 0 + - 809.434 + - - - 1856 + - 6784 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 11 + - 3964.27 + - - - 2944 + - 3584 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 13 + - 
4013.88 + - - - 1408 + - 5056 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 13 + - 3986.16 + - - - 1408 + - 704 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 0 + - 756.666 + - - - 1408 + - 6784 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 11 + - 3931.66 + - - - 4288 + - 3584 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 13 + - 3817.3 + - - - 128 + - 1024 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 6 + - 1057.39 + - - - 3584 + - 256 + - 1 + - 768 + - 3584 + - 3584 + - 768 + - 768 + - - 12 + - 2968.67 + - - - 4 + - 448 + - 1 + - 768 + - 4 + - 4 + - 768 + - 768 + - - 27 + - 24.3327 + - - - 128 + - 64 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 10.3943 + - - - 2368 + - 64 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 6 + - 886.593 + - - - 6784 + - 6784 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 11 + - 3957.45 + - - - 64 + - 1024 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 682.37 + - - - 256 + - 1408 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 3 + - 404.146 + - - - 128 + - 4288 + - 1 + - 3328 + - 128 + - 128 + - 3328 + - 3328 + - - 20 + - 2361.69 + - - - 704 + - 4288 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 13 + - 3163.07 + - - - 256 + - 4288 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 796.176 + - - - 6784 + - 6784 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 4355.54 + - - - 448 + - 128 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 18 + - 594.495 + - - - 3584 + - 5056 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 13 + - 4118.95 + - - - 704 + - 5056 + - 1 + - 256 + - 704 + - 704 + - 256 + - 256 + - - 11 + - 3112.92 + - - - 5888 + - 2368 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 13 + - 3971.76 + - - - 6784 + - 5056 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 17 + - 3921.25 + - - - 5888 + - 128 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 4 + - 690.247 + - - - 1024 + - 1856 + - 1 + - 
1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 17 + - 3870.2 + - - - 1856 + - 4 + - 1 + - 768 + - 1856 + - 1856 + - 768 + - 768 + - - 27 + - 83.9463 + - - - 64 + - 704 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 5 + - 650.293 + - - - 448 + - 128 + - 1 + - 3328 + - 448 + - 448 + - 3328 + - 3328 + - - 5 + - 1125.77 + - - - 1024 + - 128 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 22 + - 1301.34 + - - - 6784 + - 128 + - 1 + - 256 + - 6784 + - 6784 + - 256 + - 256 + - - 12 + - 2461.23 + - - - 256 + - 5056 + - 1 + - 768 + - 256 + - 256 + - 768 + - 768 + - - 12 + - 2887.0 + - - - 4288 + - 5056 + - 1 + - 3328 + - 4288 + - 4288 + - 3328 + - 3328 + - - 13 + - 4132.33 + - - - 1408 + - 128 + - 1 + - 128 + - 1408 + - 1408 + - 128 + - 128 + - - 3 + - 226.697 + - - - 1408 + - 1024 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 2991.75 + - - - 5056 + - 704 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 1713.84 + - - - 448 + - 5888 + - 1 + - 768 + - 448 + - 448 + - 768 + - 768 + - - 11 + - 3235.36 + - - - 6784 + - 1024 + - 1 + - 1792 + - 6784 + - 6784 + - 1792 + - 1792 + - - 13 + - 3907.02 + - - - 128 + - 4 + - 1 + - 768 + - 128 + - 128 + - 768 + - 768 + - - 27 + - 7.81431 + - - - 6784 + - 4 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 23 + - 62.2034 + - - - 5056 + - 6784 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 4333.83 + - - - 2368 + - 1856 + - 1 + - 768 + - 2368 + - 2368 + - 768 + - 768 + - - 12 + - 3420.8 + - - - 1408 + - 704 + - 1 + - 1792 + - 1408 + - 1408 + - 1792 + - 1792 + - - 8 + - 2476.98 + - - - 6784 + - 704 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 17 + - 3822.88 + - - - 256 + - 1408 + - 1 + - 256 + - 256 + - 256 + - 256 + - 256 + - - 8 + - 1613.19 + - - - 5056 + - 5888 + - 1 + - 128 + - 5056 + - 5056 + - 128 + - 128 + - - 0 + - 2267.63 + - - - 64 + - 448 + - 1 + - 768 + - 64 + - 64 + - 768 + - 768 + - - 18 + - 304.481 + - - - 1408 + - 64 + - 1 + - 128 + - 1408 + - 1408 + 
- 128 + - 128 + - - 3 + - 112.905 + - - - 1408 + - 4 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 27 + - 66.7496 + - - - 704 + - 5888 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 12 + - 3278.42 + - - - 4 + - 2368 + - 1 + - 128 + - 4 + - 4 + - 128 + - 128 + - - 23 + - 21.7437 + - - - 448 + - 128 + - 1 + - 256 + - 448 + - 448 + - 256 + - 256 + - - 18 + - 440.05 + - - - 2944 + - 1024 + - 1 + - 768 + - 2944 + - 2944 + - 768 + - 768 + - - 13 + - 3237.94 + - - - 3584 + - 64 + - 1 + - 1792 + - 3584 + - 3584 + - 1792 + - 1792 + - - 18 + - 1895.95 + - - - 256 + - 5888 + - 1 + - 128 + - 256 + - 256 + - 128 + - 128 + - - 0 + - 1061.5 + - - - 4288 + - 5056 + - 1 + - 256 + - 4288 + - 4288 + - 256 + - 256 + - - 17 + - 3734.33 + - - - 3584 + - 704 + - 1 + - 128 + - 3584 + - 3584 + - 128 + - 128 + - - 0 + - 1237.59 + - - - 448 + - 704 + - 1 + - 128 + - 448 + - 448 + - 128 + - 128 + - - 3 + - 373.521 + - - - 5888 + - 1024 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 11 + - 3513.81 + - - - 448 + - 256 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 18 + - 1300.77 + - - - 4 + - 5888 + - 1 + - 1792 + - 4 + - 4 + - 1792 + - 1792 + - - 27 + - 92.1515 + - - - 3584 + - 2944 + - 1 + - 3328 + - 3584 + - 3584 + - 3328 + - 3328 + - - 13 + - 3993.0 + - - - 5056 + - 1024 + - 1 + - 1792 + - 5056 + - 5056 + - 1792 + - 1792 + - - 13 + - 3596.05 + - - - 1024 + - 4288 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 17 + - 3516.59 + - - - 128 + - 5888 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 0 + - 671.416 + - - - 64 + - 5056 + - 1 + - 128 + - 64 + - 64 + - 128 + - 128 + - - 3 + - 373.815 + - - - 1408 + - 4288 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 11 + - 3490.96 + - - - 5056 + - 4288 + - 1 + - 256 + - 5056 + - 5056 + - 256 + - 256 + - - 17 + - 3731.32 + - - - 2944 + - 5888 + - 1 + - 3328 + - 2944 + - 2944 + - 3328 + - 3328 + - - 17 + - 4048.09 + - - - 704 + - 3584 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 11 + - 
3101.42 + - - - 5888 + - 128 + - 1 + - 3328 + - 5888 + - 5888 + - 3328 + - 3328 + - - 12 + - 2640.87 + - - - 448 + - 448 + - 1 + - 1792 + - 448 + - 448 + - 1792 + - 1792 + - - 6 + - 1731.14 + - - - 64 + - 5056 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 8 + - 1963.24 + - - - 2368 + - 448 + - 1 + - 256 + - 2368 + - 2368 + - 256 + - 256 + - - 12 + - 2165.03 + - - - 2368 + - 5888 + - 1 + - 3328 + - 2368 + - 2368 + - 3328 + - 3328 + - - 13 + - 3985.49 + - - - 1024 + - 3584 + - 1 + - 3328 + - 1024 + - 1024 + - 3328 + - 3328 + - - 13 + - 4105.76 + - - - 1408 + - 1024 + - 1 + - 768 + - 1408 + - 1408 + - 768 + - 768 + - - 12 + - 3216.64 + - - - 128 + - 128 + - 1 + - 128 + - 128 + - 128 + - 128 + - 128 + - - 3 + - 20.7228 + - - - 5056 + - 6784 + - 1 + - 768 + - 5056 + - 5056 + - 768 + - 768 + - - 13 + - 4246.74 + - - - 1408 + - 448 + - 1 + - 3328 + - 1408 + - 1408 + - 3328 + - 3328 + - - 20 + - 2385.51 + - - - 6784 + - 4288 + - 1 + - 3328 + - 6784 + - 6784 + - 3328 + - 3328 + - - 13 + - 4157.67 + - - - 1024 + - 5888 + - 1 + - 128 + - 1024 + - 1024 + - 128 + - 128 + - - 0 + - 1585.36 + - - - 1856 + - 2368 + - 1 + - 128 + - 1856 + - 1856 + - 128 + - 128 + - - 0 + - 1808.65 + - - - 6784 + - 3584 + - 1 + - 128 + - 6784 + - 6784 + - 128 + - 128 + - - 0 + - 2193.65 + - - - 704 + - 1408 + - 1 + - 3328 + - 704 + - 704 + - 3328 + - 3328 + - - 14 + - 2683.72 + - - - 64 + - 2368 + - 1 + - 1792 + - 64 + - 64 + - 1792 + - 1792 + - - 18 + - 1248.08 + - - - 4288 + - 1408 + - 1 + - 1792 + - 4288 + - 4288 + - 1792 + - 1792 + - - 11 + - 3500.0 + - - - 704 + - 256 + - 1 + - 128 + - 704 + - 704 + - 128 + - 128 + - - 3 + - 225.104 + - - - 704 + - 256 + - 1 + - 768 + - 704 + - 704 + - 768 + - 768 + - - 6 + - 1426.34 + - - - 704 + - 2368 + - 1 + - 1792 + - 704 + - 704 + - 1792 + - 1792 + - - 17 + - 3388.3 + - - - 1024 + - 4 + - 1 + - 1792 + - 1024 + - 1024 + - 1792 + - 1792 + - - 30 + - 91.8422 + - - - 5888 + - 4 + - 1 + - 128 + - 5888 + - 5888 + - 128 + - 128 + - - 23 + - 54.143 +- null 
diff --git a/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml new file mode 100644 index 000000000..a666e0b82 --- /dev/null +++ b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Ailk_Bjlk_SB.yaml @@ -0,0 +1,1379 @@ +- MinimumRequiredVersion: 4.13.0 +- aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + 
GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 5529.6 + 64: 8544.73 + 96: 9218.67 + 128: 9532.44 + 256: 10087.2 + 512: 10348.4 + 1024: 10511.6 + 2048: 10510.8 + 4096: 10631.3 + 8192: 10939.8 + 16192: 10997.9 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: 
+ AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_GSU1_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: 
false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 1.20019 + 64: 417.736 + 96: 611.623 + 128: 808.202 + 256: 1537.13 + 512: 2807.27 + 1024: 4662.54 + 2048: 6970.38 + 4096: 8826.89 + 8192: 9998.12 + 16192: 9087.35 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 
+ PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_GSU4_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + 
AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 6145.75 + 64: 8266.1 + 96: 9185.37 + 128: 9740.14 + 256: 10424.6 + 512: 10925.8 + 1024: 11176.0 + 2048: 11539.7 + 4096: 11683.8 + 8192: 11962.5 + 16192: 12165.3 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 128 + LSPA: 8 + LSPB: 8 + LVCA: 32 + LVCB: 32 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + 
NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x128x16_SE_GSU1_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + 
VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 221.303 + 64: 381.272 + 96: 665.106 + 128: 922.62 + 256: 1850.72 + 512: 3026.4 + 1024: 5814.41 + 2048: 7955.42 + 4096: 10207.3 + 8192: 11229.3 + 16192: 12256.0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 128 + LSPA: 8 + LSPB: 8 + LVCA: 32 + LVCB: 32 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 
16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x128x16_SE_GSU4_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + 
StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 2533.83 + 64: 3950.43 + 96: 4847.85 + 128: 5396.06 + 256: 6364.49 + 512: 7097.05 + 1024: 7498.87 + 2048: 7656.46 + 4096: 7879.08 + 8192: 8520.96 + 16192: 7924.36 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + 
LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: 
false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_GSU1_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 208.806 + 64: 405.568 + 96: 612.211 + 128: 797.428 + 256: 1429.14 + 512: 2535.16 + 1024: 3763.76 + 2048: 5101.14 + 4096: 6740.96 + 8192: 6929.77 + 16192: 7425.59 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + 
LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + 
SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_GSU4_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 +- - 2 + - 3 + - 0 + - 1 +- [] +- null +- TileSelectionIndices: + - 0 + - 1 + - 2 + - 3 + - 4 + - 5 diff --git a/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml new file mode 100644 index 000000000..7bb88d1e0 --- /dev/null +++ b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Ailk_Bljk_SB.yaml @@ -0,0 +1,1379 @@ +- MinimumRequiredVersion: 4.13.0 +- aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + 
IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 5738.83 + 64: 8510.38 + 96: 8810.57 + 128: 9132.7 + 256: 9369.45 + 512: 9613.36 + 1024: 9691.51 + 2048: 9685.3 + 4096: 9786.43 + 8192: 10164.5 + 16192: 9124.15 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + 
LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + 
UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_GSU1_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 1.25244 + 64: 421.299 + 96: 615.464 + 128: 805.52 + 256: 1536.43 + 512: 2783.58 + 1024: 4633.6 + 2048: 6930.91 + 4096: 8550.04 + 8192: 10180.7 + 16192: 9461.62 + InnerUnroll: 1 + InterleaveAlpha: 0 + 
KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + 
SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_GSU4_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + 
GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 6208.62 + 64: 7904.53 + 96: 8924.75 + 128: 9424.01 + 256: 10351.5 + 512: 10824.8 + 1024: 11132.5 + 2048: 11619.9 + 4096: 11714.0 + 8192: 12082.0 + 16192: 12154.1 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 16 + LSPA: 8 + LSPB: 64 + LVCA: 32 + LVCB: 4 + LVPA: 2 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 
4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x128x16_SE_GSU1_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + 
GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 221.194 + 64: 387.729 + 96: 671.256 + 128: 920.669 + 256: 1838.0 + 512: 3260.5 + 1024: 6096.51 + 2048: 7862.09 + 4096: 9984.71 + 8192: 11218.7 + 16192: 12191.6 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 16 + LSPA: 8 + LSPB: 64 + LVCA: 32 + LVCB: 4 + LVPA: 2 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false 
+ ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x128x16_SE_GSU4_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + 
DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 2595.78 + 64: 4059.95 + 96: 4855.24 + 128: 5375.57 + 256: 6279.78 + 512: 6961.8 + 1024: 7229.96 + 2048: 7074.15 + 4096: 7131.13 + 8192: 7582.23 + 16192: 7700.57 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + 
PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_GSU1_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + 
AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 212.399 + 64: 423.147 + 96: 607.134 + 128: 789.276 + 256: 1456.47 + 512: 2479.28 + 1024: 3675.6 + 2048: 5018.26 + 4096: 6750.5 + 8192: 6807.74 + 16192: 7942.98 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + 
NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_GSU4_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + 
WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 +- - 2 + - 3 + - 0 + - 1 +- [] +- null +- TileSelectionIndices: + - 0 + - 1 + - 2 + - 3 + - 4 + - 5 diff --git a/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml new file mode 100644 index 000000000..b0179228f --- /dev/null +++ b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Alik_Bjlk_SB.yaml @@ -0,0 +1,1379 @@ +- MinimumRequiredVersion: 4.13.0 +- aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: 
false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 5692.67 + 64: 8510.38 + 96: 8822.78 + 128: 9142.53 + 256: 9369.48 + 512: 9591.65 + 1024: 9676.35 + 2048: 9658.46 + 4096: 9774.83 + 8192: 10180.3 + 16192: 9464.3 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + 
PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x16_SE_GSU1_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + 
AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 1.25941 + 64: 418.683 + 96: 613.686 + 128: 798.703 + 256: 1515.6 + 512: 2686.94 + 1024: 4356.15 + 2048: 6273.41 + 4096: 7869.05 + 8192: 8419.6 + 16192: 8640.26 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 
+ NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x16_SE_GSU4_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + 
- 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 6097.22 + 64: 7860.64 + 96: 9122.89 + 128: 9421.42 + 256: 10310.7 + 512: 10854.2 + 1024: 11133.4 + 2048: 11596.6 + 4096: 11881.6 + 8192: 12163.8 + 16192: 12404.8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 16 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + 
MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x128x16_SE_GSU1_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 
+ SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 221.529 + 64: 379.772 + 96: 687.855 + 128: 938.628 + 256: 1843.99 + 512: 3398.55 + 1024: 5680.5 + 2048: 7871.78 + 4096: 9834.78 + 8192: 10804.4 + 16192: 11993.7 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 16 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + 
LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 
1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x128x16_SE_GSU4_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 2576.88 + 64: 4006.33 + 96: 4793.13 + 128: 5295.14 + 256: 5867.64 + 512: 6280.94 + 1024: 6478.57 + 2048: 5977.59 + 4096: 6364.19 + 8192: 6202.96 + 16192: 7189.04 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + 
LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: 
true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x16_SE_GSU1_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 212.42 + 64: 418.807 + 96: 616.119 + 128: 807.665 + 256: 
1415.8 + 512: 2381.77 + 1024: 3430.99 + 2048: 4555.79 + 4096: 5901.02 + 8192: 6005.52 + 16192: 6646.43 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + 
IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x16_SE_GSU4_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 +- - 2 + - 3 + - 0 + - 1 +- [] +- null +- TileSelectionIndices: + - 0 + - 1 + - 2 + - 3 + - 4 + - 5 diff --git a/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml new file mode 100644 index 000000000..f50c4bdac --- /dev/null +++ b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram941_Cijk_Alik_Bljk_SB.yaml @@ -0,0 +1,1815 @@ +- MinimumRequiredVersion: 4.13.0 +- aquavanjaram +- gfx941 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + 
IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 5931.19 + 64: 8104.35 + 96: 8240.68 + 128: 8561.91 + 256: 8742.57 + 512: 8914.61 + 1024: 8973.48 + 2048: 8656.25 + 4096: 9027.43 + 8192: 8886.34 + 16192: 6343.9 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + 
LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + 
TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_GSU1_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 1.24612 + 64: 414.555 + 96: 
614.692 + 128: 801.794 + 256: 1503.39 + 512: 2659.8 + 1024: 4206.22 + 2048: 6073.22 + 4096: 7639.45 + 8192: 8848.3 + 16192: 6554.51 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + 
IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_GSU4_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + 
GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 6114.75 + 64: 7610.59 + 96: 9025.94 + 128: 9247.04 + 256: 10188.5 + 512: 10817.9 + 1024: 11126.6 + 2048: 11522.1 + 4096: 11353.5 + 8192: 11837.4 + 16192: 12466.0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + 
HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x128x16_SE_GSU1_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + 
FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 220.236 + 64: 379.22 + 96: 661.446 + 128: 923.798 + 256: 1812.02 + 512: 3237.2 + 1024: 5726.21 + 2048: 7468.78 + 4096: 9922.38 + 8192: 10968.3 + 16192: 12151.2 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + 
PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x128x16_SE_GSU4_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + 
AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 2288.11 + 64: 3778.23 + 96: 4083.33 + 128: 4546.82 + 256: 4949.54 + 512: 5311.69 + 1024: 5215.47 + 2048: 4954.59 + 4096: 4860.66 + 8192: 4849.04 + 16192: 5054.93 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 
+ OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x16_SE_GSU1_TT4_4_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + 
fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 247.593 + 64: 497.038 + 96: 736.935 + 128: 961.664 + 256: 1695.97 + 512: 2714.41 + 1024: 1534.77 + 2048: 4262.15 + 4096: 4609.4 + 8192: 4900.8 + 16192: 5970.17 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + 
MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x16_SE_GSU4_TT4_4_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + 
ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 2681.0 + 64: 4025.32 + 96: 4836.8 + 128: 5182.06 + 256: 5717.53 + 512: 6010.9 + 1024: 3909.06 + 2048: 5210.48 + 4096: 5743.88 + 8192: 5474.81 + 16192: 6605.2 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: 
false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: 
Cijk_Alik_Bljk_SB_MT64x64x16_SE_GSU1_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 212.081 + 64: 398.901 + 96: 622.927 + 128: 802.475 + 256: 1400.74 + 512: 2314.28 + 1024: 3167.55 + 2048: 4116.89 + 4096: 5267.94 + 8192: 5085.11 + 16192: 6480.19 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + 
LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + 
TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_GSU4_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 +- - 2 + - 3 + - 0 + - 1 +- [] +- null +- TileSelectionIndices: + - 0 + - 1 + - 2 + - 3 + - 4 + - 5 + - 6 + - 7 diff --git a/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml new file mode 100644 index 000000000..92e1cf40d --- /dev/null +++ b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Ailk_Bjlk_SB.yaml @@ -0,0 +1,1379 @@ +- MinimumRequiredVersion: 4.13.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + 
NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 5529.6 + 64: 8544.73 + 96: 9218.67 + 128: 9532.44 + 256: 10087.2 + 512: 10348.4 + 1024: 10511.6 + 2048: 10510.8 + 4096: 10631.3 + 8192: 10939.8 + 16192: 10997.9 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + 
LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + 
ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_GSU1_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 1.20019 + 64: 417.736 + 96: 611.623 + 128: 808.202 + 256: 1537.13 + 512: 2807.27 + 1024: 4662.54 + 2048: 6970.38 + 4096: 8826.89 + 8192: 9998.12 + 16192: 9087.35 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: 
true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + 
Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_GSU4_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 6145.75 + 64: 8266.1 + 96: 9185.37 + 128: 9740.14 + 256: 10424.6 + 
512: 10925.8 + 1024: 11176.0 + 2048: 11539.7 + 4096: 11683.8 + 8192: 11962.5 + 16192: 12165.3 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 128 + LSPA: 8 + LSPB: 8 + LVCA: 32 + LVCB: 32 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + 
IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x128x16_SE_GSU1_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + 
GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 221.303 + 64: 381.272 + 96: 665.106 + 128: 922.62 + 256: 1850.72 + 512: 3026.4 + 1024: 5814.41 + 2048: 7955.42 + 4096: 10207.3 + 8192: 11229.3 + 16192: 12256.0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 128 + LSPA: 8 + LSPB: 8 + LVCA: 32 + LVCB: 32 + LVPA: 2 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + 
Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT128x128x16_SE_GSU4_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + 
GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 2533.83 + 64: 3950.43 + 96: 4847.85 + 128: 5396.06 + 256: 6364.49 + 512: 7097.05 + 1024: 7498.87 + 2048: 7656.46 + 4096: 7879.08 + 8192: 8520.96 + 16192: 7924.36 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + 
PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_GSU1_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + 
BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 208.806 + 64: 405.568 + 96: 612.211 + 128: 797.428 + 256: 1429.14 + 512: 2535.16 + 1024: 3763.76 + 2048: 5101.14 + 4096: 6740.96 + 8192: 6929.77 + 16192: 7425.59 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 64 + LSPA: 16 + LSPB: 16 + LVCA: 16 + LVCB: 16 + LVPA: 4 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + 
PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bjlk_SB_MT64x64x16_SE_GSU4_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 +- - 
2 + - 3 + - 0 + - 1 +- [] +- null +- TileSelectionIndices: + - 0 + - 1 + - 2 + - 3 + - 4 + - 5 diff --git a/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml new file mode 100644 index 000000000..9728ce7bc --- /dev/null +++ b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Ailk_Bljk_SB.yaml @@ -0,0 +1,1379 @@ +- MinimumRequiredVersion: 4.13.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + 
ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 5738.83 + 64: 8510.38 + 96: 8810.57 + 128: 9132.7 + 256: 9369.45 + 512: 9613.36 + 1024: 9691.51 + 2048: 9685.3 + 4096: 9786.43 + 8192: 10164.5 + 16192: 9124.15 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 
0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_GSU1_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + 
AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 1.25244 + 64: 421.299 + 96: 615.464 + 128: 805.52 + 256: 1536.43 + 512: 2783.58 + 1024: 4633.6 + 2048: 6930.91 + 4096: 8550.04 + 8192: 10180.7 + 16192: 9461.62 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 
256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_GSU4_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + 
_staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 6208.62 + 64: 7904.53 + 96: 8924.75 + 128: 9424.01 + 256: 10351.5 + 512: 10824.8 + 1024: 11132.5 + 2048: 11619.9 + 4096: 11714.0 + 8192: 12082.0 + 16192: 12154.1 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 16 + LSPA: 8 + LSPB: 64 + LVCA: 32 + LVCB: 4 + LVPA: 2 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 
+ MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x128x16_SE_GSU1_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + 
ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 221.194 + 64: 387.729 + 96: 671.256 + 128: 920.669 + 256: 1838.0 + 512: 3260.5 + 1024: 6096.51 + 2048: 7862.09 + 4096: 9984.71 + 8192: 11218.7 + 16192: 12191.6 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 128 + LSCB: 16 + LSPA: 8 + LSPB: 64 + LVCA: 32 + LVCB: 4 + LVPA: 2 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + 
LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + 
SolutionIndex: 3 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT128x128x16_SE_GSU4_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 2595.78 + 64: 4059.95 + 96: 4855.24 + 128: 5375.57 + 256: 6279.78 + 512: 6961.8 + 1024: 7229.96 + 2048: 7074.15 + 4096: 7131.13 + 8192: 7582.23 + 16192: 7700.57 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 
16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + 
TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_GSU1_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: false + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 212.399 + 64: 423.147 + 96: 607.134 + 128: 789.276 + 256: 1456.47 + 512: 2479.28 + 1024: 3675.6 + 
2048: 5018.26 + 4096: 6750.5 + 8192: 6807.74 + 16192: 7942.98 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 64 + LSCB: 16 + LSPA: 16 + LSPB: 64 + LVCA: 16 + LVCB: 4 + LVPA: 4 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 0 + - 3 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 1 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + 
NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: true + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: false + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Ailk_Bljk_SB_MT64x64x16_SE_GSU4_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 +- - 2 + - 3 + - 0 + - 1 +- [] +- null +- TileSelectionIndices: + - 0 + - 1 + - 2 + - 3 + - 4 + - 5 diff --git a/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml new file mode 100644 index 000000000..29f5e5759 --- /dev/null +++ b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Alik_Bjlk_SB.yaml @@ -0,0 +1,1379 @@ +- MinimumRequiredVersion: 4.13.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + 
IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 5692.67 + 64: 8510.38 + 96: 8822.78 + 128: 9142.53 + 256: 9369.48 + 512: 9591.65 + 1024: 9676.35 + 2048: 9658.46 + 4096: 9774.83 + 8192: 10180.3 + 16192: 9464.3 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + 
LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + 
Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x16_SE_GSU1_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 1.25941 + 64: 418.683 + 96: 613.686 + 128: 798.703 + 
256: 1515.6 + 512: 2686.94 + 1024: 4356.15 + 2048: 6273.41 + 4096: 7869.05 + 8192: 8419.6 + 16192: 8640.26 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + 
IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x16_SE_GSU4_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + 
GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 6097.22 + 64: 7860.64 + 96: 9122.89 + 128: 9421.42 + 256: 10310.7 + 512: 10854.2 + 1024: 11133.4 + 2048: 11596.6 + 4096: 11881.6 + 8192: 12163.8 + 16192: 12404.8 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 16 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + 
Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x128x16_SE_GSU1_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + 
GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 221.529 + 64: 379.772 + 96: 687.855 + 128: 938.628 + 256: 1843.99 + 512: 3398.55 + 1024: 5680.5 + 2048: 7871.78 + 4096: 9834.78 + 8192: 10804.4 + 16192: 11993.7 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 128 + LSPA: 64 + LSPB: 8 + LVCA: 4 + LVCB: 32 + LVPA: 16 + LVPB: 2 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + 
PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT128x128x16_SE_GSU4_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + 
BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 2576.88 + 64: 4006.33 + 96: 4793.13 + 128: 5295.14 + 256: 5867.64 + 512: 6280.94 + 1024: 6478.57 + 2048: 5977.59 + 4096: 6364.19 + 8192: 6202.96 + 16192: 7189.04 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + 
PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x16_SE_GSU1_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - 
AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: false + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 212.42 + 64: 418.807 + 96: 616.119 + 128: 807.665 + 256: 1415.8 + 512: 2381.77 + 1024: 3430.99 + 2048: 4555.79 + 4096: 5901.02 + 8192: 6005.52 + 16192: 6646.43 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 64 + LSPA: 64 + LSPB: 16 + LVCA: 4 + LVCB: 16 + LVPA: 16 + LVPB: 4 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 
0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 1 + - 3 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 1 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: true + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: true + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bjlk_SB_MT64x64x16_SE_GSU4_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 
false + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 +- - 2 + - 3 + - 0 + - 1 +- [] +- null +- TileSelectionIndices: + - 0 + - 1 + - 2 + - 3 + - 4 + - 5 diff --git a/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml new file mode 100644 index 000000000..9904e9f23 --- /dev/null +++ b/HostLibraryTests/configs/tile_aware_selection/aquavanjaram942_Cijk_Alik_Bljk_SB.yaml @@ -0,0 +1,1815 @@ +- MinimumRequiredVersion: 4.13.0 +- aquavanjaram +- gfx942 +- - Device 0049 + - Device 0050 +- AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] +- - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + 
BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 5931.19 + 64: 8104.35 + 96: 8240.68 + 128: 8561.91 + 256: 8742.57 + 512: 8914.61 + 1024: 8973.48 + 2048: 8656.25 + 4096: 9027.43 + 8192: 8886.34 + 16192: 6343.9 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + 
PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 0 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_GSU1_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + 
fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 1.24612 + 64: 414.555 + 96: 614.692 + 128: 801.794 + 256: 1503.39 + 512: 2659.8 + 1024: 4206.22 + 2048: 6073.22 + 4096: 7639.45 + 8192: 8848.3 + 16192: 6554.51 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + 
NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 1 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_GSU4_TT4_4_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + 
UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 6114.75 + 64: 7610.59 + 96: 9025.94 + 128: 9247.04 + 256: 10188.5 + 512: 10817.9 + 1024: 11126.6 + 2048: 11522.1 + 4096: 11353.5 + 8192: 11837.4 + 16192: 12466.0 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: 
false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 2 + SolutionNameMin: 
Cijk_Alik_Bljk_SB_MT128x128x16_SE_GSU1_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 220.236 + 64: 379.22 + 96: 661.446 + 128: 923.798 + 256: 1812.02 + 512: 3237.2 + 1024: 5726.21 + 2048: 7468.78 + 4096: 9922.38 + 8192: 10968.3 + 16192: 12151.2 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 8192 + LdsNumElementsAlignedA: 2048 + 
LdsNumElementsAlignedB: 2048 + LdsOffsetA: 0 + LdsOffsetA_Blk: 4096 + LdsOffsetB: 2048 + LdsOffsetB_Blk: 6144 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 1 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 16 + MacroTile0: 128 + MacroTile1: 128 + MacroTileA: 128 + MacroTileB: 128 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 64 + NumGlobalWriteVectorsPerThread: 16 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 2 + NumLoadsPerpendicularB: 2 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 
+ TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 3 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT128x128x16_SE_GSU4_TT8_8_WG16_16_1 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 16 + SubGroup1: 16 + SubGroupA: 16 + SubGroupB: 16 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 16 + - 16 + - 1 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 2288.11 + 64: 3778.23 + 96: 4083.33 + 128: 4546.82 + 256: 4949.54 + 512: 5311.69 + 1024: 5215.47 + 2048: 4954.59 + 4096: 4860.66 + 
8192: 4849.04 + 16192: 5054.93 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + 
NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 4 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x16_SE_GSU1_TT4_4_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 2 + GlobalLoadVectorWidthB: 2 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + 
GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 247.593 + 64: 497.038 + 96: 736.935 + 128: 961.664 + 256: 1695.97 + 512: 2714.41 + 1024: 1534.77 + 2048: 4262.15 + 4096: 4609.4 + 8192: 4900.8 + 16192: 5970.17 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 32 + LSPB: 32 + LVCA: 8 + LVCB: 8 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 4096 + LdsNumElementsAlignedA: 512 + LdsNumElementsAlignedB: 512 + LdsOffsetA: 0 + LdsOffsetA_Blk: 1024 + LdsOffsetB: 512 + LdsOffsetB_Blk: 1536 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 32 + MacroTile1: 32 + MacroTileA: 32 + MacroTileB: 32 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 4 + NumGlobalWriteVectorsPerThread: 1 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: 
+ - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 5 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT32x32x16_SE_GSU4_TT4_4_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 4 + - 4 + ThreadTile0: 4 + ThreadTile1: 4 + ThreadTileA: 4 + ThreadTileB: 4 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + 
GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 1 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 2681.0 + 64: 4025.32 + 96: 4836.8 + 128: 5182.06 + 256: 5717.53 + 512: 6010.9 + 1024: 3909.06 + 2048: 5210.48 + 4096: 5743.88 + 8192: 5474.81 + 16192: 6605.2 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + 
ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 6 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_GSU1_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 + - AggressivePerfMode: 1 + AssertFree0ElementMultiple: 1 + AssertFree1ElementMultiple: 1 + AssertMinApproxSize: 3 + AssertSummationElementMultiple: 1 + AssignedDerivedParameters: false + AssignedProblemIndependentDerivedParameters: true + BufferLoad: true + BufferStore: true + CheckDimOverflow: 0 + CheckTensorDimAsserts: false + DepthU: 16 + DirectToLds: false + DirectToLdsA: false + DirectToLdsB: false + 
DisableAtomicFail: 0 + DisableKernelPieces: 0 + EdgeType: ShiftPtr + ExpandPointerSwap: true + FractionalLoad: 1 + GlobalLoadVectorWidthA: 4 + GlobalLoadVectorWidthB: 4 + GlobalRead2A: true + GlobalRead2B: true + GlobalReadCoalesceGroupA: true + GlobalReadCoalesceGroupB: true + GlobalReadCoalesceVectorA: true + GlobalReadCoalesceVectorB: true + GlobalReadVectorWidth: 4 + GlobalSplitU: 4 + GlobalSplitUSummationAssignmentRoundRobin: true + GlobalSplitUWorkGroupMappingRoundRobin: false + GlobalWriteVectorWidth: 4 + GuaranteeNoPartialA: true + GuaranteeNoPartialB: true + ISA: + - 9 + - 0 + - 8 + Ideals: + 32: 212.081 + 64: 398.901 + 96: 622.927 + 128: 802.475 + 256: 1400.74 + 512: 2314.28 + 1024: 3167.55 + 2048: 4116.89 + 4096: 5267.94 + 8192: 5085.11 + 16192: 6480.19 + InnerUnroll: 1 + InterleaveAlpha: 0 + KernelLanguage: Assembly + LSCA: 16 + LSCB: 16 + LSPA: 64 + LSPB: 64 + LVCA: 4 + LVCB: 4 + LVPA: 16 + LVPB: 16 + LdcEqualsLdd: true + LdsNumElements: 16384 + LdsNumElementsAlignedA: 1024 + LdsNumElementsAlignedB: 1024 + LdsOffsetA: 0 + LdsOffsetA_Blk: 2048 + LdsOffsetB: 1024 + LdsOffsetB_Blk: 3072 + LdsPadA: 0 + LdsPadB: 0 + LocalDotLayout: 1 + LocalRead2A: true + LocalRead2B: true + LocalSplitU: 4 + LocalWrite2A: true + LocalWrite2B: true + LocalWriteUseSgprA: false + LocalWriteUseSgprB: false + LoopDoWhile: false + LoopTail: true + LoopUnroll: 4 + MacroTile0: 64 + MacroTile1: 64 + MacroTileA: 64 + MacroTileB: 64 + MacroTileShapeMax: 64 + MacroTileShapeMin: 1 + MaxOccupancy: 40 + MaxVgprNumber: 256 + MinVgprNumber: 0 + NonTemporalA: 0 + NonTemporalB: 0 + NonTemporalC: 0 + NumElementsPerThread: 16 + NumGlobalWriteVectorsPerThread: 4 + NumLoadsCoalescedA: 1 + NumLoadsCoalescedB: 1 + NumLoadsPerpendicularA: 1 + NumLoadsPerpendicularB: 1 + NumThreads: 256 + OptNoLoadLoop: 1 + PackBatchDims: 0 + PackFreeDims: 1 + PackGranularity: 2 + PackedC0IdxChars: + - I + PackedC0IndicesX: + - 0 + PackedC1IdxChars: + - J + PackedC1IndicesX: + - 1 + PerformanceSyncLocation: -1 + 
PerformanceWaitCount: -1 + PerformanceWaitLocation: -1 + PersistentKernel: 0 + PrefetchAcrossPersistent: 0 + PrefetchGlobalRead: true + PrefetchLocalRead: true + ProblemType: + AssignedDerivedParameters: true + Batched: true + ComplexConjugateA: false + ComplexConjugateB: false + ComputeDataType: 0 + ConvolutionConfig: [] + DataType: 0 + DestDataType: 0 + HighPrecisionAccumulate: false + Index0: 0 + Index01A: 0 + Index01B: 1 + Index1: 1 + IndexAssignmentsA: + - 3 + - 0 + - 2 + IndexAssignmentsB: + - 3 + - 1 + - 2 + IndexAssignmentsLD: + - 4 + - 5 + - 6 + - 7 + IndexUnroll: 3 + IndexUnrollA: 0 + IndexUnrollB: 0 + IndicesBatch: + - 2 + IndicesFree: + - 0 + - 1 + IndicesSummation: + - 3 + NumIndicesBatch: 1 + NumIndicesC: 3 + NumIndicesFree: 2 + NumIndicesLD: 4 + NumIndicesSummation: 1 + OperationType: GEMM + SetConstStrideA: [] + SetConstStrideB: [] + SilentHighPrecisionAccumulate: false + TLUA: false + TLUB: false + Tensor0: 0 + Tensor1: 1 + TileA: 0 + TileAwareSelection: true + TileB: 1 + TotalIndices: 4 + TransposeA: true + TransposeB: false + UseBeta: true + UseInitialStridesAB: false + ZeroPadA: [] + ZeroPadB: [] + ReplacementKernel: false + ScheduleGlobalRead: 1 + ScheduleIterAlg: 1 + ScheduleLocalWrite: 1 + SolutionIndex: 7 + SolutionNameMin: Cijk_Alik_Bljk_SB_MT64x64x16_SE_GSU4_TT8_8_WG8_8_4 + StaggerU: 32 + StaggerUMapping: 0 + StaggerUStride: 256 + SubGroup0: 8 + SubGroup1: 8 + SubGroupA: 8 + SubGroupB: 8 + SuppressNoLoadLoop: false + ThreadTile: + - 8 + - 8 + ThreadTile0: 8 + ThreadTile1: 8 + ThreadTileA: 8 + ThreadTileB: 8 + UnrollMemFence: false + UseSgprForGRO: 1 + Valid: true + VectorAtomicWidth: 1 + VectorStore: true + VectorWidth: 4 + WorkGroup: + - 8 + - 8 + - 4 + WorkGroupMapping: 1 + WorkGroupMappingType: B + _staggerStrideShift: 2 + fractionalPerpOverhangA: 0 + fractionalPerpOverhangB: 0 +- - 2 + - 3 + - 0 + - 1 +- [] +- null +- TileSelectionIndices: + - 0 + - 1 + - 2 + - 3 + - 4 + - 5 + - 6 + - 7 From c645384c7c1d3139ee69a8621a0fe6b192ede727 Mon 
Sep 17 00:00:00 2001 From: Babak Poursartip Date: Wed, 20 Dec 2023 16:03:40 -0600 Subject: [PATCH 24/51] adding code owners file (#1852) Co-authored-by: Babak --- .github/CODEOWNERS | 1 + 1 file changed, 1 insertion(+) create mode 100644 .github/CODEOWNERS diff --git a/.github/CODEOWNERS b/.github/CODEOWNERS new file mode 100644 index 000000000..2c966a9dc --- /dev/null +++ b/.github/CODEOWNERS @@ -0,0 +1 @@ +* @babakpst @yoichiyoshida @bragadeesh @AlexBrownAMD From b23f55bb758d088d05a2bbbd0a7b0cfeaca017fd Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Thu, 21 Dec 2023 16:46:37 +0900 Subject: [PATCH 25/51] Revert "Optimization for ShadowLimit (#1829)" (#1855) This reverts commit 9e8f1ab9b708c52271dd53d5e20d45c59d3b5993. --- Tensile/KernelWriter.py | 23 ----- Tensile/KernelWriterAssembly.py | 146 +++++++++++++++----------------- 2 files changed, 66 insertions(+), 103 deletions(-) diff --git a/Tensile/KernelWriter.py b/Tensile/KernelWriter.py index e51b22e63..ca9fbd6ce 100644 --- a/Tensile/KernelWriter.py +++ b/Tensile/KernelWriter.py @@ -3748,29 +3748,6 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): self.tailLoopInNLL = noTailLoop >= 2 self.noEarlyExitForTailLoopInNLL = noTailLoop == 3 - # no ShadowLimit code in loop optimization - # we do not need ShadowLimit check in loop under certain conditions - # noTailLoop=1 (TODO: support TailLoop) - # BufferLoad - # FractionalLoad==0 - # no packBatchDims - # EdgeType == Shift - # CheckDimOverflow < 2 - # MT0, MT1, DepthU are power of 2 - # TLU case only - def isPowerOf2(val): - return val > 0 and (val & (val - 1)) == 0 - self.noShadowLimitCodeInLoopA = False - self.noShadowLimitCodeInLoopB = False - if noTailLoop == 1 and kernel["BufferLoad"] and kernel["FractionalLoad"] == 0 and \ - kernel["PackBatchDims"] == 0 and kernel["EdgeType"] == "ShiftPtr" and \ - kernel["CheckDimOverflow"] <= 1 and \ - isPowerOf2(kernel["MacroTileA"]) and 
isPowerOf2(kernel["MacroTileB"]) and isPowerOf2(kernel["DepthU"]): - if tluA: - self.noShadowLimitCodeInLoopA = True - if tluB: - self.noShadowLimitCodeInLoopB = True - self.actualSummationLoops = 1 if kernel["PackSummationDims"] else kernel["ProblemType"]["NumIndicesSummation"] self.otherSummationLoops = self.actualSummationLoops-1 self.otherSummations = kernel["ProblemType"]["NumIndicesSummation"]-1 # not loops but summations vars diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index 8153375f3..2637949e0 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -596,10 +596,8 @@ def defineVariableSgprs(self, kernel): self.defineSgpr("PerpOverhangVccB", 2, 2) if self.use64bShadowLimit: # If need more SGPR could overlap this with the Tensor2dSize regs - if self.noShadowLimitCodeInLoopA == False: - self.defineSgpr("ShadowLimitA", 2, 2) - if self.noShadowLimitCodeInLoopB == False: - self.defineSgpr("ShadowLimitB", 2, 2) + self.defineSgpr("ShadowLimitA", 2, 2) + self.defineSgpr("ShadowLimitB", 2, 2) if kernel["PackSummationDims"]: for tc in ('A','B'): @@ -4937,44 +4935,38 @@ def computeLoadSrd(self, kernel, tP, tc, indices, bpe, isPap): kStr += inst("s_mov_b32", sgpr(tileStart+0), 0, "set default tileStart") kStr += inst("s_mov_b32", sgpr(tileStart+1), 0, "set default tileStart") - noShadowLimitCodeInLoop = self.noShadowLimitCodeInLoopA if tc == "A" else self.noShadowLimitCodeInLoopB - if noShadowLimitCodeInLoop == False: - if self.use64bShadowLimit: - limitTmp0 = "ShadowLimit%s+0"%tc - limitTmp1 = "ShadowLimit%s+1"%tc - else: - limitTmp0 = stmp+0 - limitTmp1 = stmp+1 + if self.use64bShadowLimit: + limitTmp0 = "ShadowLimit%s+0"%tc + limitTmp1 = "ShadowLimit%s+1"%tc + else: + limitTmp0 = stmp+0 + limitTmp1 = stmp+1 - kStr += inst("s_sub_u32", sgpr(limitTmp0), sgpr("Tensor2dSize%s"%tc), sgpr(tileStart+0), "sub tileStart") - kStr += inst("s_subb_u32", sgpr(limitTmp1), sgpr("Tensor2dSize%s+1"%tc), 
sgpr(tileStart+1), "sub tileStart") + kStr += inst("s_sub_u32", sgpr(limitTmp0), sgpr("Tensor2dSize%s"%tc), sgpr(tileStart+0), "sub tileStart") + kStr += inst("s_subb_u32", sgpr(limitTmp1), sgpr("Tensor2dSize%s+1"%tc), sgpr(tileStart+1), "sub tileStart") - if self.use64bShadowLimit: - # Set initial buffer limit - # if the limit is >64bit, incrementSrd decrements the shadow as the SRD increments, - # and when we get within 32-bit we start to step down the SRD - # if the limit is <32bits, set it accurately here: - # Note lshl_b64 the higher-numbered SGPR has the upper 32-bits - kStr += inst("s_lshl_b64", sgpr("ShadowLimit%s"%tc,2), sgpr("ShadowLimit%s"%tc,2), \ - hex(log2(tP["bpe"])), "Set limit to use bytes") - if prePad: - kStr += inst("s_add_u32", sgpr("ShadowLimit%s+0"%tc), sgpr("ShadowLimit%s+0"%tc), prePad, "extend limit for pre-pad") - kStr += inst("s_addc_u32", sgpr("ShadowLimit%s+1"%tc), sgpr("ShadowLimit%s+1"%tc), 0, "extend limit for pre-pad") - - if kernel["DirectToLds%s"%tc] and kernel["UseInstOffsetForGRO"]: - kStr += inst("s_add_u32", sgpr("ShadowLimit%s+0"%tc), sgpr("ShadowLimit%s+0"%tc), self.buff_load_inst_offset_max, "extend limit for directToLDS instruction offset") - kStr += inst("s_addc_u32", sgpr("ShadowLimit%s+1"%tc), sgpr("ShadowLimit%s+1"%tc), 0, "extend limit for directToLDS instruction offset") - - kStr += inst("s_cmp_eq_u32", sgpr("ShadowLimit%s+1"%tc), 0, "are we within 2^32?") - kStr += inst("s_cselect_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), "BufferLimit%s"%tc, "Move shadow to real if we are within 2^32") - else: - # put limit directly into SRD: - kStr += inst("s_lshl_b32", sgpr("Srd%s+2"%tc), sgpr(stmp+0), hex(log2(tP["bpe"])), "Set limit to use bytes") - kStr += inst("s_add_u32", sgpr("Srd%s+2"%tc), sgpr("Srd%s+2"%tc), prePad, "extend limit for pre-pad") + if self.use64bShadowLimit: + # Set initial buffer limit + # if the limit is >64bit, incrementSrd decrements the shadow as the SRD increments, + # and when we get 
within 32-bit we start to step down the SRD + # if the limit is <32bits, set it accurately here: + # Note lshl_b64 the higher-numbered SGPR has the upper 32-bits + kStr += inst("s_lshl_b64", sgpr("ShadowLimit%s"%tc,2), sgpr("ShadowLimit%s"%tc,2), \ + hex(log2(tP["bpe"])), "Set limit to use bytes") + if prePad: + kStr += inst("s_add_u32", sgpr("ShadowLimit%s+0"%tc), sgpr("ShadowLimit%s+0"%tc), prePad, "extend limit for pre-pad") + kStr += inst("s_addc_u32", sgpr("ShadowLimit%s+1"%tc), sgpr("ShadowLimit%s+1"%tc), 0, "extend limit for pre-pad") + + if kernel["DirectToLds%s"%tc] and kernel["UseInstOffsetForGRO"]: + kStr += inst("s_add_u32", sgpr("ShadowLimit%s+0"%tc), sgpr("ShadowLimit%s+0"%tc), self.buff_load_inst_offset_max, "extend limit for directToLDS instruction offset") + kStr += inst("s_addc_u32", sgpr("ShadowLimit%s+1"%tc), sgpr("ShadowLimit%s+1"%tc), 0, "extend limit for directToLDS instruction offset") + + kStr += inst("s_cmp_eq_u32", sgpr("ShadowLimit%s+1"%tc), 0, "are we within 2^32?") + kStr += inst("s_cselect_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), "BufferLimit%s"%tc, "Move shadow to real if we are within 2^32") else: - # noShadowLimitCodeInLoop case - # no out of range check - kStr += inst("s_mov_b32", sgpr("Srd%s+2"%tc), "BufferLimit%s"%tc, "Set BufferLimit in no ShadowLimit code case") + # put limit directly into SRD: + kStr += inst("s_lshl_b32", sgpr("Srd%s+2"%tc), sgpr(stmp+0), hex(log2(tP["bpe"])), "Set limit to use bytes") + kStr += inst("s_add_u32", sgpr("Srd%s+2"%tc), sgpr("Srd%s+2"%tc), prePad, "extend limit for pre-pad") # Apply any high-order address components to the tileStart and eventually the SRD - batch idx for batched gemm if kernel["ProblemType"]["StridedBatched"]: @@ -5065,7 +5057,7 @@ def computeLoadSrd(self, kernel, tP, tc, indices, bpe, isPap): # invalid global read for performance evaluation only if self.enable["InvalidGlobalRead%s"%tc]: kStr += inst("s_mov_b32", sgpr("Srd%s+2"%tc), hex(0), "set out-of-bound addr for 
performance evaluation only") - if noShadowLimitCodeInLoop == False and self.use64bShadowLimit: + if self.use64bShadowLimit: kStr += inst("s_mov_b32", sgpr("ShadowLimit%s+1"%tc), hex(0xffffffff), "set out-of-bound addr for performance evaluation only") return kStr @@ -7751,34 +7743,32 @@ def incrementSrd(self, kernel, tP, incLower, incUpper, checkShadowLimitCopy=True incUpper, \ "gra SRD += inc(upper)" ) - noShadowLimitCodeInLoop = self.noShadowLimitCodeInLoopA if tc == "A" else self.noShadowLimitCodeInLoopB - if noShadowLimitCodeInLoop == False: - # also have to move the boundary since we change the base - # so less buffers to the edge: - if self.use64bShadowLimit: - imod.addInst("s_sub_u32", \ - sgpr("ShadowLimit%s+0"%tc), \ - sgpr("ShadowLimit%s+0"%tc), \ - incLower, \ - "limit -= inc)") - imod.addInst("s_subb_u32", \ - sgpr("ShadowLimit%s+1"%tc), \ - sgpr("ShadowLimit%s+1"%tc), \ - incUpper, \ - "limit -= inc)" ) - if checkShadowLimitCopy: - imod.addInst("s_cmp_eq_u32", sgpr("ShadowLimit%s+1"%tc), 0, "are we within 2^32?") - if self.staggerU: - # staggerU case, need to restore BufferLimit when ShadowLimit goes to negative value - imod.addInst("s_cselect_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), "BufferLimit%s"%tc, "Move shadow to real if we are within 2^32") - else: - imod.addInst("s_cmov_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), "Move shadow to real if we are within 2^32") - else: - imod.addInst("s_sub_u32", \ - sgpr("Srd%s+2"%(tc)), \ - sgpr("Srd%s+2"%(tc)), \ - incLower, \ - "limit -= inc)" ) + # also have to move the boundary since we change the base + # so less buffers to the edge: + if self.use64bShadowLimit: + imod.addInst("s_sub_u32", \ + sgpr("ShadowLimit%s+0"%tc), \ + sgpr("ShadowLimit%s+0"%tc), \ + incLower, \ + "limit -= inc)") + imod.addInst("s_subb_u32", \ + sgpr("ShadowLimit%s+1"%tc), \ + sgpr("ShadowLimit%s+1"%tc), \ + incUpper, \ + "limit -= inc)" ) + if checkShadowLimitCopy: + imod.addInst("s_cmp_eq_u32", 
sgpr("ShadowLimit%s+1"%tc), 0, "are we within 2^32?") + if self.staggerU: + # staggerU case, need to restore BufferLimit when ShadowLimit goes to negative value + imod.addInst("s_cselect_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), "BufferLimit%s"%tc, "Move shadow to real if we are within 2^32") + else: + imod.addInst("s_cmov_b32", sgpr("Srd%s+2"%tc), sgpr("ShadowLimit%s+0"%tc), "Move shadow to real if we are within 2^32") + else: + imod.addInst("s_sub_u32", \ + sgpr("Srd%s+2"%(tc)), \ + sgpr("Srd%s+2"%(tc)), \ + incLower, \ + "limit -= inc)" ) return imod ############################################################################## @@ -8032,14 +8022,12 @@ def globalReadIncrementAB(self, kernel, loopIdx, prefetchIndex, incs=1): for tc in ('A','B'): incCodeA.addInst("s_mov_b32", sgpr("Srd%s+0"%tc), sgpr("InitialSrd%sBase+0"%tc), "restore base") incCodeA.addInst("s_mov_b32", sgpr("Srd%s+1"%tc), sgpr("InitialSrd%sBase+1"%tc), "restore base") - noShadowLimitCodeInLoop = self.noShadowLimitCodeInLoopA if tc == "A" else self.noShadowLimitCodeInLoopB - if noShadowLimitCodeInLoop == False: - if self.use64bShadowLimit: - incCodeA.addInst("s_mov_b32", sgpr("ShadowLimit%s+0"%tc), sgpr("InitialSrd%sLimit+0"%tc), "restore shadow limit") - incCodeA.addInst("s_mov_b32", sgpr("ShadowLimit%s+1"%tc), sgpr("InitialSrd%sLimit+1"%tc), "restore shadow limit") - assert(0) # not tested, would maybe need to restore base too if limit 0 - else: - incCodeA.addInst("s_mov_b32", sgpr("Srd%s+2"%tc), sgpr("InitialSrd%sLimit"%tc), "restore limit") + if self.use64bShadowLimit: + incCodeA.addInst("s_mov_b32", sgpr("ShadowLimit%s+0"%tc), sgpr("InitialSrd%sLimit+0"%tc), "restore shadow limit") + incCodeA.addInst("s_mov_b32", sgpr("ShadowLimit%s+1"%tc), sgpr("InitialSrd%sLimit+1"%tc), "restore shadow limit") + assert(0) # not tested, would maybe need to restore base too if limit 0 + else: + incCodeA.addInst("s_mov_b32", sgpr("Srd%s+2"%tc), sgpr("InitialSrd%sLimit"%tc), "restore limit") # TODO 
- this skips over the stagger-u wrap codes @@ -15093,10 +15081,8 @@ def openPrefetchAcrossPersistent(self, kernel, isOptNLL, useBufferOOB=False): # reseting SrdA/B, ShadowLimitA/B, GlobalReadIncsA/B is more efficiently way than using BufferOOB imod.addInst("s_cmov_b32", sgpr("SrdA+2"), 0, "Set SrdA+2 to 0 for outside legal WG") imod.addInst("s_cmov_b32", sgpr("SrdB+2"), 0, "Set SrdB+2 to 0 for outside legal WG") - if self.noShadowLimitCodeInLoopA == False: - imod.addInst("s_cmov_b64", sgpr("ShadowLimitA", 2), 0, "Set ShadowLimitA to 0 for outside legal WG") - if self.noShadowLimitCodeInLoopB == False: - imod.addInst("s_cmov_b64", sgpr("ShadowLimitB", 2), 0, "Set ShadowLimitB to 0 for outside legal WG") + imod.addInst("s_cmov_b64", sgpr("ShadowLimitA", 2), 0, "Set ShadowLimitA to 0 for outside legal WG") + imod.addInst("s_cmov_b64", sgpr("ShadowLimitB", 2), 0, "Set ShadowLimitB to 0 for outside legal WG") imod.addInst("s_cmov_b32", sgpr("GlobalReadIncsA"), 0, "Stop decrementing ShadowLimitA and incrementing SrdA for outside legal WG") imod.addInst("s_cmov_b32", sgpr("GlobalReadIncsB"), 0, "Stop decrementing ShadowLimitB and incrementing SrdB for outside legal WG") else: From 3f431a65c112a290ee10ab593042ac68cb0222ee Mon Sep 17 00:00:00 2001 From: Babak Poursartip Date: Thu, 21 Dec 2023 12:58:49 -0600 Subject: [PATCH 26/51] updating Codeowners file (#1856) --- .github/CODEOWNERS | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/CODEOWNERS b/.github/CODEOWNERS index 2c966a9dc..b337c8b28 100644 --- a/.github/CODEOWNERS +++ b/.github/CODEOWNERS @@ -1 +1 @@ -* @babakpst @yoichiyoshida @bragadeesh @AlexBrownAMD +* @babakpst @yoichiyoshida @bragadeesh @AlexBrownAMD @nakajee \ No newline at end of file From 900fb387d42c1d3d2f3c465f3c63135688dc327f Mon Sep 17 00:00:00 2001 From: Babak Poursartip Date: Tue, 2 Jan 2024 16:47:00 -0600 Subject: [PATCH 27/51] updating lib logic convertor script (#1857) --- tuning/automation/LibraryLogicConvertor.py | 74 
++++++++++++---------- 1 file changed, 40 insertions(+), 34 deletions(-) diff --git a/tuning/automation/LibraryLogicConvertor.py b/tuning/automation/LibraryLogicConvertor.py index 988aa7b6f..ac8972c46 100644 --- a/tuning/automation/LibraryLogicConvertor.py +++ b/tuning/automation/LibraryLogicConvertor.py @@ -29,36 +29,43 @@ import argparse import shutil -# reference/mother lib logics -validLogics={ - 'F8SS_NN': 'aquavanjaram_Cijk_Ailk_Bljk_F8SS_BH.yaml', - 'F8F8S_NN': 'aquavanjaram_Cijk_Ailk_Bljk_F8F8S_BH.yaml', - 'F8HS_NN': 'aquavanjaram_Cijk_Ailk_Bljk_F8HS_BH.yaml', - 'F8F8S_SR_NN':'aquavanjaram_Cijk_Ailk_Bljk_F8F8S_SR_BH.yaml', - 'BBS_NN': 'aquavanjaram_Cijk_Ailk_Bljk_BBS_BH.yaml', - 'BSS_NN': 'aquavanjaram_Cijk_Ailk_Bljk_BSS_BH.yaml', - - 'F8SS_NT': 'aquavanjaram_Cijk_Ailk_Bjlk_F8SS_BH.yaml', - 'F8F8S_NT': 'aquavanjaram_Cijk_Ailk_Bjlk_F8F8S_BH.yaml', - 'F8HS_NT': 'aquavanjaram_Cijk_Ailk_Bjlk_F8HS_BH.yaml', - 'F8F8S_SR_NT':'aquavanjaram_Cijk_Ailk_Bjlk_F8F8S_SR_BH.yaml', - 'BBS_NT': 'aquavanjaram_Cijk_Ailk_Bjlk_BBS_BH.yaml', - 'BSS_NT': 'aquavanjaram_Cijk_Ailk_Bjlk_BSS_BH.yaml', - - 'F8SS_TN': 'aquavanjaram_Cijk_Alik_Bljk_F8SS_BH.yaml', - 'F8F8S_TN': 'aquavanjaram_Cijk_Alik_Bljk_F8F8S_BH.yaml', - 'F8HS_TN': 'aquavanjaram_Cijk_Alik_Bljk_F8HS_BH.yaml', - 'F8F8S_SR_TN':'aquavanjaram_Cijk_Alik_Bljk_F8F8S_SR_BH.yaml', - 'BBS_TN': 'aquavanjaram_Cijk_Alik_Bljk_BBS_BH.yaml', - 'BSS_TN': 'aquavanjaram_Cijk_Alik_Bljk_BSS_BH.yaml', - - 'F8SS_TT': 'aquavanjaram_Cijk_Alik_Bjlk_F8SS_BH.yaml', - 'F8F8S_TT': 'aquavanjaram_Cijk_Alik_Bjlk_F8F8S_BH.yaml', - 'F8HS_TT': 'aquavanjaram_Cijk_Alik_Bjlk_F8HS_BH.yaml', - 'F8F8S_SR_TT':'aquavanjaram_Cijk_Alik_Bjlk_F8F8S_SR_BH.yaml', - 'BBS_TT': 'aquavanjaram_Cijk_Alik_Bjlk_BBS_BH.yaml', - 'BSS_TT': 'aquavanjaram_Cijk_Alik_Bjlk_BSS_BH.yaml' - } +validLogics=[ +'aquavanjaram942_Cijk_Ailk_Bljk_F8SS_BH.yaml', # 'F8SS_NN' +'aquavanjaram942_Cijk_Ailk_Bljk_F8F8S_BH.yaml', # 'F8F8S_NN' +'aquavanjaram942_Cijk_Ailk_Bljk_F8HS_BH.yaml', # 'F8HS_NN' 
+'aquavanjaram942_Cijk_Ailk_Bljk_F8F8S_SR_BH.yaml', # 'F8F8S_SR_NN' +'aquavanjaram942_Cijk_Ailk_Bljk_BBS_BH.yaml', # 'BBS_NN' +'aquavanjaram942_Cijk_Ailk_Bljk_HHS_BH.yaml', # 'HHS_NN' +'aquavanjaram942_Cijk_Ailk_Bljk_BSS_BH.yaml', # 'BSS_NN' +'aquavanjaram942_Cijk_Ailk_Bljk_HSS_BH.yaml', # 'HSS_NN' + +'aquavanjaram942_Cijk_Ailk_Bjlk_F8SS_BH.yaml', # 'F8SS_NT' +'aquavanjaram942_Cijk_Ailk_Bjlk_F8F8S_BH.yaml', # 'F8F8S_NT' +'aquavanjaram942_Cijk_Ailk_Bjlk_F8HS_BH.yaml', # 'F8HS_NT' +'aquavanjaram942_Cijk_Ailk_Bjlk_F8F8S_SR_BH.yaml', # 'F8F8S_SR_NT' +'aquavanjaram942_Cijk_Ailk_Bjlk_BBS_BH.yaml', # 'BBS_NT' +'aquavanjaram942_Cijk_Ailk_Bjlk_HHS_BH.yaml', # 'HHS_NT' +'aquavanjaram942_Cijk_Ailk_Bjlk_BSS_BH.yaml', # 'BSS_NT' +'aquavanjaram942_Cijk_Ailk_Bjlk_HSS_BH.yaml', # 'HSS_NT' + +'aquavanjaram942_Cijk_Alik_Bljk_F8SS_BH.yaml', # 'F8SS_TN' +'aquavanjaram942_Cijk_Alik_Bljk_F8F8S_BH.yaml', # 'F8F8S_TN' +'aquavanjaram942_Cijk_Alik_Bljk_F8HS_BH.yaml', # 'F8HS_TN' +'aquavanjaram942_Cijk_Alik_Bljk_F8F8S_SR_BH.yaml', # 'F8F8S_SR_TN' +'aquavanjaram942_Cijk_Alik_Bljk_BBS_BH.yaml', # 'BBS_TN' +'aquavanjaram942_Cijk_Alik_Bljk_HHS_BH.yaml', # 'HHS_TN' +'aquavanjaram942_Cijk_Alik_Bljk_BSS_BH.yaml', # 'BSS_TN' +'aquavanjaram942_Cijk_Alik_Bljk_HSS_BH.yaml', # 'HSS_TN' + +'aquavanjaram942_Cijk_Alik_Bjlk_F8SS_BH.yaml', # 'F8SS_TT' +'aquavanjaram942_Cijk_Alik_Bjlk_F8F8S_BH.yaml', # 'F8F8S_TT' +'aquavanjaram942_Cijk_Alik_Bjlk_F8HS_BH.yaml', # 'F8HS_TT' +'aquavanjaram942_Cijk_Alik_Bjlk_F8F8S_SR_BH.yaml', # 'F8F8S_SR_TT' +'aquavanjaram942_Cijk_Alik_Bjlk_BBS_BH.yaml', # 'BBS_TT' +'aquavanjaram942_Cijk_Alik_Bjlk_HHS_BH.yaml', # 'HHS_TT' +'aquavanjaram942_Cijk_Alik_Bjlk_BSS_BH.yaml', # 'BSS_TT' +'aquavanjaram942_Cijk_Alik_Bjlk_HSS_BH.yaml' # 'HSS_TT' +] # family lib logics conversions={ @@ -66,6 +73,8 @@ 'F8F8S' : ['F8B8B8S', 'B8B8S', 'B8F8B8S'], 'F8HS' : ['B8HS', 'F8B8HS', 'B8F8HS'], 'F8F8S_SR': ['F8B8B8S_SR', 'B8B8S_SR', 'B8F8B8S_SR'], + 'HHS' : ['BBS'], + 'HSS' : ['BSS'], 'BBS' : ['HHS'], 
'BSS' : ['HSS'] } @@ -116,7 +125,6 @@ 'HSS': [' DataType: 4', ' DestDataType: 0', ' ComputeDataType: 0'] } - def parseArgs(): argParser = argparse.ArgumentParser() @@ -129,14 +137,13 @@ def parseArgs(): return argParser.parse_args() - # This def reads all the files in the liblogic and only selects the reference yamls (see the table) def getLogics(liblogic): logics = [] for yaml in os.listdir(liblogic): - for val in validLogics.values(): + for val in validLogics: if (os.path.isfile(os.path.join(liblogic, yaml)) and yaml == val): logics.append(yaml) break @@ -201,4 +208,3 @@ def main(): if __name__ == "__main__": main() - From 4d63f70f2b7f866afb847fd3ed3d8d66e2cdf758 Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Wed, 10 Jan 2024 09:02:42 -0700 Subject: [PATCH 28/51] Temporarily disable failing tests until bug fix is in mainline build (#1860) --- .jenkins/extended.groovy | 3 ++- .jenkins/precheckin.groovy | 3 ++- Tensile/Tests/extended/multi_sum_psd/1sum_gsu_simple.yaml | 3 +++ Tensile/Tests/extended/multi_sum_psd/1sum_simple.yaml | 3 +++ 4 files changed, 10 insertions(+), 2 deletions(-) diff --git a/.jenkins/extended.groovy b/.jenkins/extended.groovy index 44ad373be..62b0498a4 100644 --- a/.jenkins/extended.groovy +++ b/.jenkins/extended.groovy @@ -63,7 +63,8 @@ def runCI = platform, project-> def test_marks = "extended" - commonGroovy.runTestCommand(platform, project, jobName, test_marks) + boolean skipHostTest = true // Skip host test for now, until compiler update is available + commonGroovy.runTestCommand(platform, project, jobName, test_marks, skipHostTest) } buildProject(prj, formatCheck, nodes.dockerArray, compileCommand, testCommand, null) diff --git a/.jenkins/precheckin.groovy b/.jenkins/precheckin.groovy index 5552c359b..9183934a1 100644 --- a/.jenkins/precheckin.groovy +++ b/.jenkins/precheckin.groovy @@ -63,7 +63,8 @@ def runCI = platform, project-> def test_marks = "pre_checkin" - commonGroovy.runTestCommand(platform, project, jobName, test_marks) + 
boolean skipHostTest = true // Skip host test for now, until compiler update is available + commonGroovy.runTestCommand(platform, project, jobName, test_marks, skipHostTest) } buildProject(prj, formatCheck, nodes.dockerArray, compileCommand, testCommand, null) diff --git a/Tensile/Tests/extended/multi_sum_psd/1sum_gsu_simple.yaml b/Tensile/Tests/extended/multi_sum_psd/1sum_gsu_simple.yaml index 5887cccdf..def472522 100644 --- a/Tensile/Tests/extended/multi_sum_psd/1sum_gsu_simple.yaml +++ b/Tensile/Tests/extended/multi_sum_psd/1sum_gsu_simple.yaml @@ -1,3 +1,6 @@ +TestParameters: + marks: [xfail] + GlobalParameters: EnqueuesPerSync: 1 LibraryPrintDebug: 0 diff --git a/Tensile/Tests/extended/multi_sum_psd/1sum_simple.yaml b/Tensile/Tests/extended/multi_sum_psd/1sum_simple.yaml index a6dcda809..fa615a065 100644 --- a/Tensile/Tests/extended/multi_sum_psd/1sum_simple.yaml +++ b/Tensile/Tests/extended/multi_sum_psd/1sum_simple.yaml @@ -1,3 +1,6 @@ +TestParameters: + marks: [xfail] + GlobalParameters: EnqueuesPerSync: 1 LibraryPrintDebug: 0 From d2924ce5fa010872212d6940ad208d8561dd4cbe Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Thu, 11 Jan 2024 01:42:29 +0900 Subject: [PATCH 29/51] Fix mismatch issue with InitAccOpt + InnerUnroll (#1858) - use const 0 for src1 of MFMA only if index of innerUnrll (iui) is 0 --- Tensile/KernelWriterAssembly.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index 2637949e0..7e27b8dd9 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2016-2023 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2016-2024 Advanced Micro Devices, Inc. All rights reserved. 
# # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -7209,6 +7209,7 @@ def mfmaIter(self, kernel, u, innerUnroll, vregSetIdx, lastKinloop=False, tail=F prevAccIdx = -1 for iui in range(0, innerUnroll): + firstIterIui0 = firstIter and iui == 0 # InnerUnroll case, use const 0 for src1 only if iui == 0 zgemmVaddSrcCheck = [[], [], []] # to avoid generating redundant v_add outer = 1 # swap inner loop and outer loop so that idxA comes outer @@ -7293,9 +7294,9 @@ def mfmaIter(self, kernel, u, innerUnroll, vregSetIdx, lastKinloop=False, tail=F zgemmVaddSrcCheck[arrayIndex].append(ar) imod.addInst(shiftKStr + \ "".join([inst for inst in ccInsts if inst is not None]) + \ - mfmaComponent(self, accStart, accEnd, ar, br, accStart, accEnd, 0, firstIter), "Cr += Ar*Br") + mfmaComponent(self, accStart, accEnd, ar, br, accStart, accEnd, 0, firstIterIui0), "Cr += Ar*Br") src0 = vgpr(ccVgprs[1], numRegistersOut) if ccVgprs[1] else ai - imod.addInst(mfmaComponent(self, accStart+accImOffset, accEnd+accImOffset, src0, br, accStartSrcImg, accEndSrcImg, 0, firstIter), "Ci += %sAi*Br"%("-" if ccVgprs[1] else "")) + imod.addInst(mfmaComponent(self, accStart+accImOffset, accEnd+accImOffset, src0, br, accStartSrcImg, accEndSrcImg, 0, firstIterIui0), "Ci += %sAi*Br"%("-" if ccVgprs[1] else "")) src0 = vgpr(ccVgprs[0], numRegistersOut) if ccVgprs[0] else ai imod.addInst(mfmaComponent(self, accStart, accEnd, src0, bi, accStart, accEnd, accStoreCIdx, False), "Cr += %sAi*Bi"%("-" if ccVgprs[0] else "")) src0 = vgpr(ccVgprs[2], numRegistersOut) if ccVgprs[2] else ar @@ -7313,7 +7314,7 @@ def mfmaIter(self, kernel, u, innerUnroll, vregSetIdx, lastKinloop=False, tail=F waitCode = "" if waits > 0 and (prevAccIdx == accIdx or numMfma == 1): waitCode += inst("s_nop %u"%(waits - 1), "Wait for C") - imod.addCode(shiftKStr + waitCode + mfmaComponent(self, accStart, accEnd, Str0, Str1, accStart, 
accEnd, accStoreCIdx, firstIter)) + imod.addCode(shiftKStr + waitCode + mfmaComponent(self, accStart, accEnd, Str0, Str1, accStart, accEnd, accStoreCIdx, firstIterIui0)) prevAccIdx = accIdx # clear shiftKStr From 4ed0f4bbf569352d9e59f49ca3a37c30cb99e851 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Fri, 12 Jan 2024 08:23:36 +0900 Subject: [PATCH 30/51] VectorWidthB support, VectorWidth + non SourceSwap support, small bug fix for ClusterLocalRead (#1859) - supported VectorWidthB (added a new parameter VectorWidthB) - supported VectorWidth + non SourceSwap - fixed innacurate vgpr allocation for ClusterLocalRead - added test cases for VectorWidthB, VectorWidth + non SourceSwap - fixed mismatch issue with LdsBlockSizePerPad + MT1(or 0) not power of 2 --- Tensile/Common.py | 7 +- Tensile/Components/ComputeStoreVgprs.py | 12 +- Tensile/Components/LocalRead.py | 8 +- Tensile/Components/LraTileAssignment.py | 6 +- .../Components/NotLocalFullTileElements.py | 7 +- Tensile/Components/ShiftVectorComponents.py | 16 +- Tensile/Components/Signature.py | 8 +- Tensile/KernelWriter.py | 35 ++-- Tensile/KernelWriterAssembly.py | 178 ++++++----------- Tensile/SolutionStructs.py | 185 +++++++++++------- .../local_split_u/hgemm_lsu_mfma.yaml | 52 +++++ .../local_split_u/igemm_lsu_mfma.yaml | 51 +++++ .../local_split_u/sgemm_lsu_mfma.yaml | 53 +++++ 13 files changed, 380 insertions(+), 238 deletions(-) diff --git a/Tensile/Common.py b/Tensile/Common.py index caf361fcb..47c762a00 100644 --- a/Tensile/Common.py +++ b/Tensile/Common.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2016-2023 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2016-2024 Advanced Micro Devices, Inc. All rights reserved. 
# # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -1223,9 +1223,9 @@ def getArchitectureName(gfxName): # Typically matching 16 bytes is good choice since the stores will be optimally coalesced with 16 bytes/WI. # -1 means use the largest vector width up to 128 bits. # Using a VW too large which results in >16bytes/thread isn't supported - # For MFMA non SourceSwap: this parameter didn't take effect - # For MFMA SourceSwap: this parameter only take effect on A buffer for now "VectorWidth": [ -1, 1, 2, 3, 4, 6, 8, 16 ], + # VectorWidth for B (MatrixInstruction only) + "VectorWidthB": [ -1, 1, 2, 4, 8, 16 ], # If 0, store 1 element per instruction. # If 1, store vector-width elements per instruction. @@ -1432,6 +1432,7 @@ def getArchitectureName(gfxName): {"ClusterLocalRead": [ False ] }, {"MaxOccupancy": [ 40 ] }, {"VectorWidth": [ -1 ] }, + {"VectorWidthB": [ -1 ] }, {"VectorStore": [ -1 ] }, {"StoreVectorWidth": [ -1 ] }, {"GlobalLoadVectorWidthA": [ -1 ] }, diff --git a/Tensile/Components/ComputeStoreVgprs.py b/Tensile/Components/ComputeStoreVgprs.py index b1dfbcc38..25c4adb2b 100644 --- a/Tensile/Components/ComputeStoreVgprs.py +++ b/Tensile/Components/ComputeStoreVgprs.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2021-2023 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2021-2024 Advanced Micro Devices, Inc. All rights reserved. 
# # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -173,7 +173,7 @@ def __call__(self, writer, kernel, divisor, tid0Scale, tid1Scale): # coord 1 : thread part kStr += vectorStaticRemainder(tmpVgpr0, "Serial", matrixInstN, tmpSgpr) - kStr += inst("_v_add_u32", vgpr(tid1), vgpr(tmpVgpr0), vgpr(tid1), "coordination 1 = wave_id1 + tid1") + kStr += inst("_v_add_lshl_u32", vgpr(tid1), vgpr(tmpVgpr0), vgpr(tid1), log2(kernel["VectorWidthB"]), "coordination 1 = vwb *(wave_id1 + tid1)") if kernel["BufferStore"]: # coord 1 : offset part @@ -197,7 +197,7 @@ def __call__(self, writer, kernel, divisor, tid0Scale, tid1Scale): kStr += vectorStaticRemainder(tmpVgpr0, wave_id, kernel["MIWaveGroup"][0], tmpSgpr) kStr += inst("v_mul_lo_u32", vgpr(tmpVgpr0), hex(MIBShape0), vgpr(tmpVgpr0), "wave coordination offset 0") - kStr += inst("_v_add_u32", vgpr(tid0), vgpr(tmpVgpr0), vgpr(tid0), "coordination 0 = wave_id0 + tid0") + kStr += inst("_v_add_lshl_u32", vgpr(tid0), vgpr(tmpVgpr0), vgpr(tid0), log2(kernel["VectorWidthA"]), "coordination 0 = vwa *(wave_id0 + tid0)") if writer.prefetchAcrossPersistent: wg0="PrevWorkGroup0" @@ -289,9 +289,7 @@ def __call__(self, writer, kernel, divisor, tid0Scale, tid1Scale): # coord 1 : wave part kStr += vectorStaticDivide(tmpVgpr0, wave_id, kernel["MIWaveGroup"][0], tmpSgpr) kStr += inst("v_mul_lo_u32", vgpr(tmpVgpr0), hex(MIBShape1), vgpr(tmpVgpr0), "wave coordination offset 1") - kStr += inst("_v_add_u32", vgpr(tid1), vgpr(tmpVgpr0), vgpr(tid1), "coordination 1 = wave_id1 + tid1") - if writer.VectorWidthB > 1: - kStr += staticMultiply(vgpr(tid1), vgpr(tid1), writer.lrvwB, sgpr(tmpSgpr), "coordination 1 *= lrvwB") + kStr += inst("_v_add_lshl_u32", vgpr(tid1), vgpr(tmpVgpr0), vgpr(tid1), log2(kernel["VectorWidthB"]), "coordination 1 = vwb *(wave_id1 + tid1)") if kernel["BufferStore"]: # coord 1 : offset part @@ -308,7 +306,7 @@ def 
__call__(self, writer, kernel, divisor, tid0Scale, tid1Scale): # coord 0 : thread part kStr += vectorStaticRemainder(tid0, "Serial", matrixInstM, tmpSgpr) - kStr += inst("_v_add_lshl_u32", vgpr(tid0), vgpr(tmpVgpr0), vgpr(tid0), log2(kernel["VectorWidth"]), "coordination 0 = wave_id0 + tid0") + kStr += inst("_v_add_lshl_u32", vgpr(tid0), vgpr(tmpVgpr0), vgpr(tid0), log2(kernel["VectorWidthA"]), "coordination 0 = vwa *(wave_id0 + tid0)") if writer.prefetchAcrossPersistent: wg0="PrevWorkGroup0" diff --git a/Tensile/Components/LocalRead.py b/Tensile/Components/LocalRead.py index 681d2ef03..8edca8896 100644 --- a/Tensile/Components/LocalRead.py +++ b/Tensile/Components/LocalRead.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2021-2023 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2021-2024 Advanced Micro Devices, Inc. All rights reserved. # # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -144,8 +144,9 @@ def __call__(self, writer, bufferIdx, iui, epsi, tP): numOffsets = instruction.numOffsets blockWidth = instruction.blockWidth bpr = writer.bpr - vectorWidthA = kernel["VectorWidth"] if kernel["SourceSwap"] else 1 # TODO: nonSwap VectorWidth - vectorWidthB = writer.VectorWidthB + vectorWidth = kernel["VectorWidth%s"%tc] + vectorWidthA = kernel["VectorWidthA"] + vectorWidthB = kernel["VectorWidthB"] MIWaveGroupShape = [ kernel["MatrixInstM"] * kernel["MatrixInstBM"] * kernel["MIWaveGroup"][0] * vectorWidthA, \ kernel["MatrixInstN"] * kernel["MatrixInstBN"] * kernel["MIWaveGroup"][1] * vectorWidthB] @@ -156,7 +157,6 @@ def __call__(self, writer, bufferIdx, iui, epsi, tP): tileStride = kernel["_DepthULds"] + LdsPad UnrollStride = 1 - vectorWidth = vectorWidthA if (tile01 == 0) else vectorWidthB numVectorsPerTile = kernel["MIWaveTile"][tile01] // vectorWidth 
numReadsPerVector = vectorWidth if kernel["UnrollMajorLDS%s"%tc] else (vectorWidth * tP["bpe"]) // int(blockWidth * 4) numReadsPerUnroll = ceil(tP["bpe"] * lrvw / int(blockWidth * 4)) if kernel["UnrollMajorLDS%s"%tc] else kernel["MIInputPerThread"] # bytes/register diff --git a/Tensile/Components/LraTileAssignment.py b/Tensile/Components/LraTileAssignment.py index 9ea978777..438714d08 100644 --- a/Tensile/Components/LraTileAssignment.py +++ b/Tensile/Components/LraTileAssignment.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2021-2022 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2021-2024 Advanced Micro Devices, Inc. All rights reserved. # # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -120,9 +120,7 @@ def __call__(self, writer, kernel, tP): else: dividedForBlkId = (kernel["MatrixInstN"] * kernel["MatrixInstBN"]) if (tile01 == 0) else kernel["MatrixInstN"] dividedForWaveId = waveWidth if (tile01 == 0) else (waveWidth * kernel["MIWaveGroup"][0]) - vectorWidth = kernel["VectorWidth"] if ((tile01 == 0) and kernel["SourceSwap"]) else 1 # TODO: nonSwap VectorWidth - if tP["isB"] : - vectorWidth = writer.VectorWidthB + vectorWidth = kernel["VectorWidth%s"%tc] # strider for each type of index mt = kernel["MacroTile%u" % tile01] diff --git a/Tensile/Components/NotLocalFullTileElements.py b/Tensile/Components/NotLocalFullTileElements.py index 1d1e6cb29..4bed6dc65 100644 --- a/Tensile/Components/NotLocalFullTileElements.py +++ b/Tensile/Components/NotLocalFullTileElements.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2021-2023 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2021-2024 Advanced Micro Devices, Inc. All rights reserved. 
# # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -88,9 +88,8 @@ def __call__(self, writer, kernel, edge): totalTT0 = totalTT0 if kernel["SourceSwap"] else (totalTT0 * outputsPerThread) totalTT1 = (totalTT1 * outputsPerThread) if kernel["SourceSwap"] else totalTT1 - vectorWidth0 = kernel["VectorWidth"] if kernel["SourceSwap"] else 1 * kernel["MIOutputVectorWidth"] # VW for non SourceSwap not supported yet - vwB = writer.VectorWidthB - vectorWidth1 = vwB * kernel["MIOutputVectorWidth"] if kernel["SourceSwap"] else vwB + vectorWidth0 = kernel["VectorWidthA"] if kernel["SourceSwap"] else kernel["VectorWidthA"] * kernel["MIOutputVectorWidth"] + vectorWidth1 = kernel["VectorWidthB"] * kernel["MIOutputVectorWidth"] if kernel["SourceSwap"] else kernel["VectorWidthB"] for tt1 in range(0, totalTT1//vectorWidth1): for vc1 in range(0, vectorWidth1): diff --git a/Tensile/Components/ShiftVectorComponents.py b/Tensile/Components/ShiftVectorComponents.py index 037130cd9..5503294b3 100644 --- a/Tensile/Components/ShiftVectorComponents.py +++ b/Tensile/Components/ShiftVectorComponents.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2021-2023 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2021-2024 Advanced Micro Devices, Inc. All rights reserved. # # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -264,21 +264,11 @@ def __call__(self, writer, kernel, tP): use partial thread algorithm """ - # TODO: use this for non SourceSwap for B? - # this part can support non SourceSwap for B - # But let non SourceSwap for B go original shiftptr path - # return here only for LSU=1. 
LSU>1 case needs the code below - if (not kernel["SourceSwap"]) and tP["isB"] and kernel["LocalSplitU"]==1: - return "" - # common parameter + tc = tP["tensorChar"] glvw = tP["glvw"] numThreadInWave = writer.kernel["WavefrontSize"] - vectorWidth = kernel["VectorWidth"] if (kernel["SourceSwap"] and tP["isA"]) else 1 - # support for VectorWidthB - # use lrvwB as vectorWidth in B case - if tP["isB"]: - vectorWidth = writer.VectorWidthB + vectorWidth = kernel["VectorWidth%s"%tc] # use to handle MatrixInst 4x4 matrixInstM = kernel["MatrixInstM"] * kernel["MatrixInstBM"] if (kernel["MatrixInstM"] == 4) else kernel["MatrixInstM"] diff --git a/Tensile/Components/Signature.py b/Tensile/Components/Signature.py index 2a5ca9b28..665f2bef2 100644 --- a/Tensile/Components/Signature.py +++ b/Tensile/Components/Signature.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2020-2022 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2020-2024 Advanced Micro Devices, Inc. All rights reserved. 
# # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -159,7 +159,11 @@ def __call__(self, writer): kStr += writer.comment3("Optimizations and Config:") kStr += writer.comment1("ThreadTile= %u x %u" % (kernel["ThreadTile0"], kernel["ThreadTile1"])) kStr += writer.comment1("SubGroup= %u x %u" % (kernel["SubGroup0"], kernel["SubGroup1"])) - kStr += writer.comment1("VectorWidth=%u" % (kernel["VectorWidth"])) + if kernel["EnableMatrixInstruction"]: + kStr += writer.comment1("VectorWidthA=%u" % (kernel["VectorWidthA"])) + kStr += writer.comment1("VectorWidthB=%u" % (kernel["VectorWidthB"])) + else: + kStr += writer.comment1("VectorWidth=%u" % (kernel["VectorWidth"])) glvw = kernel["GlobalLoadVectorWidthA"] glvwAStr = "GlobalLoadVectorWidthA=%f"%glvw if glvw < 1 else "GlobalLoadVectorWidthA=%u"%glvw glvw = kernel["GlobalLoadVectorWidthB"] diff --git a/Tensile/KernelWriter.py b/Tensile/KernelWriter.py index ca9fbd6ce..19d36082b 100644 --- a/Tensile/KernelWriter.py +++ b/Tensile/KernelWriter.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2016-2023 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2016-2024 Advanced Micro Devices, Inc. All rights reserved. 
# # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -3859,9 +3859,6 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): vwa = kernel["GlobalLoadVectorWidthA"] vwb = kernel["GlobalLoadVectorWidthB"] - # allow LocalReadVectorWidthB for TLUB + MatrixInstruction - self.VectorWidthB = kernel["VectorWidthB"] - # lrvwTileA,B # lrvwTileA,B > 1 is to use wider local read + v_perm # MIInputPerThread > 1 case, we need MIInputPerThread continuous K elements @@ -3891,12 +3888,13 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): # VectorWidthA,B > 1 self.lrvwTileA = 1 self.lrvwTileB = 1 - if kernel["EnableMatrixInstruction"] and kernel["MIInputPerThread"] > 1 and\ - kernel["SourceSwap"] and kernel["VgprForLocalReadPacking"] and kernel["ClusterLocalRead"]: + self.useWiderLocalReadB = False + if kernel["EnableMatrixInstruction"] and kernel["MIInputPerThread"] > 1 and \ + kernel["VgprForLocalReadPacking"] and kernel["ClusterLocalRead"]: if (not kernel["UnrollMajorLDSA"]): - self.lrvwTileA = min(kernel["MIInputPerThread"], kernel["VectorWidth"]) # should not exceed MIInputPerThread + self.lrvwTileA = min(kernel["MIInputPerThread"], kernel["VectorWidthA"]) # should not exceed MIInputPerThread if (not kernel["UnrollMajorLDSB"]): - self.lrvwTileB = min(kernel["MIInputPerThread"], self.VectorWidthB) # should not exceed MIInputPerThread + self.lrvwTileB = min(kernel["MIInputPerThread"], kernel["VectorWidthB"]) # should not exceed MIInputPerThread self.numItersPLR = kernel["PrefetchLocalRead"]%kernel["LoopIters"] self.numVgprBuffer = kernel["LoopIters"] if kernel["PrefetchLocalRead"] > kernel["LoopIters"] else kernel["PrefetchLocalRead"] @@ -3908,20 +3906,23 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): self.lrvwA = kernel["MIInputPerThread"] if kernel["DirectToVgprA"]: # DirectToVgprA case, ignore 
LocalReadVectorWidth and use GlobalLoadVectorWidth instead. - self.lrvwA = max(kernel["MIInputPerThread"], vwa) + self.lrvwA = vwa else: self.lrvwA = 1 if kernel["UnrollMajorLDSB"]: self.lrvwB = kernel["LocalReadVectorWidth"] else: if kernel["EnableMatrixInstruction"]: + # MI + UMLDS, we need minimum of MIInputPerThread for lrvw + self.lrvwB = kernel["MIInputPerThread"] if kernel["DirectToVgprB"]: # DirectToVgprB case, ignore LocalReadVectorWidth and use GlobalLoadVectorWidth instead. - self.lrvwB = max(kernel["MIInputPerThread"], vwb) - else: + self.lrvwB = vwb + elif kernel["DirectToVgprA"] and kernel["ProblemType"]["TLUA"]: # MI + UMLDS, we need minimum of MIInputPerThread for lrvw - # self.VectorWidthB > MIInputPerThread case, use self.VectorWidthB as lrvwB - self.lrvwB = max(kernel["MIInputPerThread"], self.VectorWidthB) + # DirectToVgprA + TLUA + UnrollMajorLDSB=False case, allow wider LocalReadVectorWidth + self.lrvwB = kernel["LocalReadVectorWidth"] + self.useWiderLocalReadB = self.lrvwB > kernel["MIInputPerThread"] else: self.lrvwB = 1 @@ -3955,7 +3956,7 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): else: # read components, write components self.readTileDimComponentsA = False # Scalar self.readTileDimVectorA = False # Scalar - self.readUnrollDimComponentsA = kernel["VectorWidth"] > 1 # Components + self.readUnrollDimComponentsA = kernel["VectorWidthA"] > 1 # Components self.readUnrollDimVectorA = False # Components self.numReadsTileVecCompA = 1 self.numReadsUnrollVecCompA = vwa @@ -3970,7 +3971,7 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): self.numReadsUnrollVecCompA = vwa self.numReadsTileVecCompA = 1 else: # read components, write vectors - self.readTileDimComponentsA = kernel["VectorWidth"] > 1 # Components + self.readTileDimComponentsA = kernel["VectorWidthA"] > 1 # Components self.readTileDimVectorA = False # Components self.readUnrollDimComponentsA = False # Scalar self.readUnrollDimVectorA = 
False # Scalar @@ -4063,7 +4064,7 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): else: self.readTileDimComponentsB = False # Scalar self.readTileDimVectorB = False # Scalar - self.readUnrollDimComponentsB = kernel["VectorWidth"] > 1 # Components + self.readUnrollDimComponentsB = kernel["VectorWidthB"] > 1 # Components self.readUnrollDimVectorB = False # Components # NEW self.numReadsTileVecCompB = 1 @@ -4079,7 +4080,7 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): self.numReadsUnrollVecCompB = vwb self.numReadsTileVecCompB = 1 else: - self.readTileDimComponentsB = kernel["VectorWidth"] > 1 # Components + self.readTileDimComponentsB = kernel["VectorWidthB"] > 1 # Components self.readTileDimVectorB = False # Components self.readUnrollDimComponentsB = False # Scalar self.readUnrollDimVectorB = False # Scalar diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index 7e27b8dd9..ad39ae82a 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -1202,18 +1202,18 @@ def initKernel(self, kernel, tPA, tPB ): ######################################## # localRead A - localReadWidth = (kernel["VectorWidth"] * tPA["bpe"]) // self.bpr + localReadWidth = (kernel["VectorWidthA"] * tPA["bpe"]) // self.bpr if kernel["EnableMatrixInstruction"]: localReadWidth = self.lrvwTileA * tPA["bpe"] / self.bpr if kernel["UnrollMajorLDSA"] or kernel["DirectToVgprA"]: - # DTVA case, no local read is actually generated, but this still affects (dummy) local read sccheduling for DTVA + # DTVA case, no local read is actually generated, but this still affects (dummy) local read scheduling for DTVA localReadWidth = (self.lrvwA * tPA["bpe"]) // self.bpr #localReadStridePerpendicular = 0 localRead2Perpendicular = False self.localReadStrideCoalescedA = \ kernel["ThreadTile0"] * tPA["bpe"]//self.bpr - self.localRead2CoalescedA = kernel["ThreadTile0"]//kernel["VectorWidth"] > 1 + 
self.localRead2CoalescedA = kernel["ThreadTile0"]//kernel["VectorWidthA"] > 1 self.localReadInstructionIdxA = \ self.selectMemoryInstruction("LocalRead", localReadWidth, \ kernel["LocalRead2A"], \ @@ -1226,17 +1226,18 @@ def initKernel(self, kernel, tPA, tPB ): ######################################## # localRead B - localReadWidth = (kernel["VectorWidth"] * tPB["bpe"]) // self.bpr + localReadWidth = (kernel["VectorWidthB"] * tPB["bpe"]) // self.bpr if kernel["EnableMatrixInstruction"]: localReadWidth = self.lrvwTileB * tPB["bpe"] / self.bpr - if kernel["UnrollMajorLDSB"] or self.VectorWidthB > 1: + if kernel["UnrollMajorLDSB"] or kernel["DirectToVgprB"] or (kernel["DirectToVgprA"] and self.useWiderLocalReadB): + # DTVB case, no local read is actually generated, but this still affects (dummy) local read scheduling for DTVB localReadWidth = (self.lrvwB * tPB["bpe"]) // self.bpr #localReadStridePerpendicular = 0 localRead2Perpendicular = False self.localReadStrideCoalescedB = \ kernel["ThreadTile1"] * tPB["bpe"]//self.bpr - self.localRead2CoalescedB = kernel["ThreadTile1"]//kernel["VectorWidth"] > 1 + self.localRead2CoalescedB = kernel["ThreadTile1"]//kernel["VectorWidthB"] > 1 self.localReadInstructionIdxB = \ self.selectMemoryInstruction("LocalRead", localReadWidth, \ kernel["LocalRead2B"], \ @@ -1320,14 +1321,24 @@ def initKernel(self, kernel, tPA, tPB ): self.numElemPerBprA = (4 / tPA["bpe"]) needVgprForPack = self.needPackA and kernel["VgprForLocalReadPacking"] if needVgprForPack: - valuBlocksPack = (int(self.numElemPerBprA) - 1) if self.lrvwTileA == 1 else self.lrvwTileA + if self.lrvwTileA > 1: + self.numVgprValuA //= (1+PLR) + numLoadPerReg = max(1, int(self.numElemPerBprA)//self.lrvwTileA) + valuBlocksPack = (1+PLR) * numLoadPerReg + else: + valuBlocksPack = (int(self.numElemPerBprA) - 1) self.numVgprValuPackA = self.numVgprValuA * valuBlocksPack self.numVgprValuPackB =0 self.numElemPerBprB = (4 / tPB["bpe"]) needVgprForPack = self.needPackB and 
kernel["VgprForLocalReadPacking"] if needVgprForPack: - valuBlocksPack = (int(self.numElemPerBprB) - 1) if self.lrvwTileB == 1 else self.lrvwTileB + if self.lrvwTileB > 1: + self.numVgprValuB //= (1+PLR) + numLoadPerReg = max(1, int(self.numElemPerBprB)//self.lrvwTileB) + valuBlocksPack = (1+PLR) * numLoadPerReg + else: + valuBlocksPack = (int(self.numElemPerBprB) - 1) self.numVgprValuPackB = self.numVgprValuB * valuBlocksPack #################################### @@ -1644,9 +1655,9 @@ def initKernel(self, kernel, tPA, tPB ): # need proper alignment for G2LC vgprIdx = ((vgprIdx+Calign - 1)//Calign)*Calign self.startVgprG2LC = vgprIdx - vgprIdx += (kernel["VectorWidth"] * tPA["bpe"]) // self.bpr + vgprIdx += (kernel["VectorWidthA"] * tPA["bpe"]) // self.bpr self.startVgprL2GC = vgprIdx - vgprIdx += ((kernel["VectorWidth"] * tPA["bpe"]) // self.bpr) + vgprIdx += ((kernel["VectorWidthA"] * tPA["bpe"]) // self.bpr) if not kernel["AtomicAddC"] and kernel["ProblemType"]["UseBeta"]: self.GlobalReadOffsetC = vgprIdx vgprIdx +=1 @@ -2052,7 +2063,11 @@ def initKernel(self, kernel, tPA, tPB ): # DTVA case, no local read is actually generated, but this still affects (dummy) local read scheduling for DTVA numA //= self.lrvwA if kernel["InnerUnroll"] >= self.numReadsIterCoalescedB: - numB //= (self.numReadsIterCoalescedB * self.VectorWidthB) + numB //= self.numReadsIterCoalescedB + if self.useWiderLocalReadB: + # use wider local read for UnrollMajorLDSB=False + # numB needs to be divided by lrvwB + numB //= self.lrvwB else: numB = kernel["InnerUnroll"]*(kernel["ThreadTile1"] // kernel["VectorWidth"]) // tPB["localReadInstruction"].numOffsets numA = kernel["InnerUnroll"]*(kernel["ThreadTile0"] // kernel["VectorWidth"]) // tPA["localReadInstruction"].numOffsets @@ -4068,7 +4083,9 @@ def graTileAssignment(self, kernel, tP): dividedForBlkId = kernel["MatrixInstM"] if (tile01 == 0) else (kernel["MatrixInstM"] * kernel["MatrixInstBM"]) else: dividedForBlkId = (kernel["MatrixInstN"] * 
kernel["MatrixInstBN"]) if (tile01 == 0) else kernel["MatrixInstN"] - vectorWidth = 1 # kernel["VectorWidth"] if ((tile01 == 0) and kernel["SourceSwap"]) else 1 # TODO: nonSwap VectorWidth + # TLU case, glvw and vw are applied to the same direction. No need to apply both. + # non TLU case, glvw and vw are applied to the different direction. We need to apply vw here. + vectorWidth = 1 if tP["tlu"] else kernel["VectorWidth%s"%tc] strideTile = 1 # tentative strideBlock = kernel["MatrixInstM"] * strideTile strideWave = kernel["MatrixInstM"] * num1DBlocks * strideTile * vectorWidth @@ -4096,6 +4113,8 @@ def graTileAssignment(self, kernel, tP): else: # comment only because bnIdx = bnIdx % num1DBlocks(1) = 0 kStr += instCommentOnly("2. block offset: bnIdx = bnIdx %% num1DBlocks(%u) is 0. do nothing" % num1DBlocks) + kStr += staticMultiply(vgpr(rReg), vgpr(rReg), vectorWidth, sgpr(tmpSgpr), \ + "4. apply VectorWidth: bnOffset = bnOffset * vw(%u)" % vectorWidth) # unroll offset # need division for qReg kStr += vectorStaticDivide(qReg, qReg, dividendForKId, tmpSgpr, \ @@ -4186,10 +4205,6 @@ def graTileAssignment(self, kernel, tP): else: kStr += self.comment1("gro-unroll *= glvw") kStr += vectorStaticMultiply(uReg, uReg, tP["glvw"], tmpSgpr) - if forceSwap and tc == "A": - # in this case, need to multiply vw to gro-tile - kStr += self.comment1("gro-tile *= vw") - kStr += staticMultiply(vgpr(tReg), vgpr(tReg), kernel["VectorWidth"], sgpr(tmpSgpr)) if not self.groOffsetInMacroTile: # Buffer Load will set the SRD to start of the MacroTile @@ -4308,12 +4323,12 @@ def graTileOffsets(self, kernel, tP): tP["vgprPackedOffsets"] = self.vgprPool.checkOut(numExtraPackedOffsetsPerTile * numTileOffsets, "vgprPackedOffsets", self.preventVgprOverflowDuringNewTile) strideIdx = tP["lsc"] if tP["tlu"] else tP["lsp"] stride = kernel[strideIdx] - # adjustment for DirectToVgpr + tlu=False + VW > 1 case (A only) + # adjustment for DirectToVgpr + tlu=False + VW > 1 case strideInterleave = False - 
if kernel["DirectToVgpr%c"%tc] and (not tP["tlu"]) and kernel["VectorWidth"] > 1 and tc == "A": + if kernel["DirectToVgpr%c"%tc] and (not tP["tlu"]) and kernel["VectorWidth%s"%tc] > 1: strideInterleave = True - stride = stride * kernel["VectorWidth"] - (kernel["VectorWidth"] - 1) - strideMask = (kernel["VectorWidth"] - 1) + stride = stride * kernel["VectorWidth%s"%tc] - (kernel["VectorWidth%s"%tc] - 1) + strideMask = (kernel["VectorWidth%s"%tc] - 1) bpeOffset = 1 if tP["glvw"] >= 1 else tP["bpe"] # glvw<1 case, need to multiply strideValue by bpe if tP["rtc"]: @@ -9945,7 +9960,6 @@ def localSplitULocalWriteOffsetAddressMFMA(self, kernel): # constant MIBShape0 = kernel["MatrixInstM"] * kernel["MatrixInstBM"] MIBShape1 = kernel["MatrixInstN"] * kernel["MatrixInstBN"] - VectorWidth = kernel["VectorWidth"] if kernel["SourceSwap"] else 1 if kernel["SourceSwap"]: # SourceSwap case, use M @@ -9995,8 +10009,7 @@ def localSplitULocalWriteOffsetAddressMFMA(self, kernel): kStr += inst("_v_add_u32", vgpr(tid1), vgpr(tmpVgpr0), vgpr(tid1), "coordination 1 = wave_id1 + tid1") # adjustment for B vector - if self.VectorWidthB > 1: - kStr += staticMultiply(vgpr(tid1), vgpr(tid1), self.lrvwB, sgpr(tmpSgpr), "coordination 1 *= lrvwB") + kStr += staticMultiply(vgpr(tid1), vgpr(tid1), kernel["VectorWidthB"], sgpr(tmpSgpr), "coordination 1 *= vwB") # tid1 *= MT0*bpe kStr += staticMultiply(vgpr(tid1), vgpr(tid1), kernel["MacroTile0"]*self.bpeCinternal, sgpr(tmpSgpr), "coordination 1 *= (MT0*bpe)") @@ -10029,8 +10042,8 @@ def localSplitULocalWriteOffsetAddressMFMA(self, kernel): kStr += inst("v_mul_lo_u32", vgpr(tmpVgpr0), hex(MIBShape0), vgpr(tmpVgpr0), "wave coordination offset 0") kStr += inst("_v_add_u32", vgpr(tid0), vgpr(tmpVgpr0), vgpr(tid0), "tid0 += wave coordination offset 0") - # tid0 *= VW*bpe - kStr += staticMultiply(vgpr(tid0), vgpr(tid0), VectorWidth*self.bpeCinternal, sgpr(tmpSgpr), "coordination 0 *= (VW*bpe)") + # tid0 *= VWA*bpe + kStr += staticMultiply(vgpr(tid0), 
vgpr(tid0), kernel["VectorWidthA"]*self.bpeCinternal, sgpr(tmpSgpr), "coordination 0 *= (VWA*bpe)") # tid = tid0 + tid1 kStr += inst("_v_add_u32", vgpr(tid0), vgpr(tid1), vgpr(tid0), "tid = tid0 + tid1") @@ -10070,7 +10083,6 @@ def lsuMFMAWriteElements(self, kernel, gwvw, elements): coordOffset1 = 0 - vc1Scale = self.VectorWidthB MIOutputVectorWidth = kernel["MIOutputVectorWidth"] MFMAContinuousOutputs = MIOutputVectorWidth if kernel["SourceSwap"] else 1 OutputsPerMIMN = (matrixInstM * matrixInstN // kernel["WavefrontSize"]) if kernel["SourceSwap"] else 1 @@ -10086,9 +10098,8 @@ def lsuMFMAWriteElements(self, kernel, gwvw, elements): coordOffset1 = eIdx1 * (WavefrontSize // matrixInstN) * MFMAContinuousOutputs coordOffset1 += bIdx1 * matrixInstN coordOffset1 += wtIdex * matrixInstN * matrixInstBN * kernel["MIWaveGroup"][1] - coordOffset1 = coordOffset1 * vc1Scale + vc1 + coordOffset1 = coordOffset1 * kernel["VectorWidthB"] + vc1 - vectorWidth = kernel["VectorWidth"] if kernel["SourceSwap"] else 1 # TODO: nonSwap VectorWidth MFMAContinuousOutputs = 1 if kernel["SourceSwap"] else MIOutputVectorWidth OutputsPerMIMN = 1 if kernel["SourceSwap"] else matrixInstM * matrixInstN // WavefrontSize @@ -10099,10 +10110,10 @@ def lsuMFMAWriteElements(self, kernel, gwvw, elements): remain_d0 = remain_d0 // matrixInstBM wtIdex = remain_d0 % kernel["MIWaveTile"][0] - coordOffset0 = eIdx0 * vectorWidth * (WavefrontSize // matrixInstM) * MFMAContinuousOutputs - coordOffset0 += bIdx0 * vectorWidth * matrixInstM - coordOffset0 += wtIdex * vectorWidth * matrixInstM * matrixInstBM * kernel["MIWaveGroup"][0] - coordOffset0 += vc0 + coordOffset0 = eIdx0 * (WavefrontSize // matrixInstM) * MFMAContinuousOutputs + coordOffset0 += bIdx0 * matrixInstM + coordOffset0 += wtIdex * matrixInstM * matrixInstBM * kernel["MIWaveGroup"][0] + coordOffset0 = coordOffset0 * kernel["VectorWidthA"] + vc0 # Step 2: generate move code from acc to vgpr (no move necessary for MIArchVgpr case (some exceptions)) # 
loop over scalars within one store instruction @@ -11140,7 +11151,7 @@ def __init__(self, kernelWriter, kernel, gwvw, edge, beta, atomic, elements, isW # # Also create an AddrCalc for each memory operation. ############################################################################## - def setupStoreElementsForBatch(self, kernel, gwvw, batchElements, batchElementSgprs, preventOverflow, VectorWidthB, isWorkspace=False): + def setupStoreElementsForBatch(self, kernel, gwvw, batchElements, batchElementSgprs, preventOverflow, isWorkspace=False): self.elementAddr = [] self.elementData = [] # VGPR to use for element data, needed for atomic or beta @@ -11177,7 +11188,6 @@ def setupStoreElementsForBatch(self, kernel, gwvw, batchElements, batchElementSg coordOffset1 = 0 if kernel["EnableMatrixInstructionStore"]: - vc1Scale = VectorWidthB MIOutputVectorWidth = kernel["MIOutputVectorWidth"] MFMAContinuousOutputs = MIOutputVectorWidth if kernel["SourceSwap"] else 1 OutputsPerMIMN = (matrixInstM * matrixInstN // self.kernel["WavefrontSize"]) if kernel["SourceSwap"] else 1 @@ -11192,7 +11202,7 @@ def setupStoreElementsForBatch(self, kernel, gwvw, batchElements, batchElementSg coordOffset1 = eIdx1 * (self.kernel["WavefrontSize"] // matrixInstN) * MFMAContinuousOutputs coordOffset1 += bIdx1 * matrixInstN coordOffset1 += wtIdex * matrixInstN * matrixInstBN * kernel["MIWaveGroup"][1] - coordOffset1 = coordOffset1 * vc1Scale + vc1 + coordOffset1 = coordOffset1 * kernel["VectorWidthB"] + vc1 else: if kernel["LocalSplitU"] > 1: strideD1 = (kernel["NumThreads"]*kernel["VectorWidth"]//kernel["MacroTile0"]) @@ -11205,7 +11215,6 @@ def setupStoreElementsForBatch(self, kernel, gwvw, batchElements, batchElementSg # gpr and offset assignments for element coordOffset0 = 0 if kernel["EnableMatrixInstructionStore"]: - vectorWidth = kernel["VectorWidth"] if kernel["SourceSwap"] else 1 # TODO: nonSwap VectorWidth MFMAContinuousOutputs = 1 if kernel["SourceSwap"] else kernel["MIOutputVectorWidth"] 
OutputsPerMIMN = 1 if kernel["SourceSwap"] else matrixInstM * matrixInstN // self.kernel["WavefrontSize"] @@ -11216,10 +11225,10 @@ def setupStoreElementsForBatch(self, kernel, gwvw, batchElements, batchElementSg remain_d0 = remain_d0 // matrixInstBM wtIdex = remain_d0 % kernel["MIWaveTile"][0] - coordOffset0 = eIdx0 * vectorWidth * (self.kernel["WavefrontSize"] // matrixInstM) * MFMAContinuousOutputs - coordOffset0 += bIdx0 * vectorWidth * matrixInstM - coordOffset0 += wtIdex * vectorWidth * matrixInstM * matrixInstBM * kernel["MIWaveGroup"][0] - coordOffset0 += vc0 + coordOffset0 = eIdx0 * (self.kernel["WavefrontSize"] // matrixInstM) * MFMAContinuousOutputs + coordOffset0 += bIdx0 * matrixInstM + coordOffset0 += wtIdex * matrixInstM * matrixInstBM * kernel["MIWaveGroup"][0] + coordOffset0 = coordOffset0 * kernel["VectorWidth"] + vc0 else: coordOffset0 = d0 * kernel["SubGroup0"]*kernel["VectorWidth"] + vc0 @@ -11296,9 +11305,9 @@ def setupStoreElementsForBatch(self, kernel, gwvw, batchElements, batchElementSg #print "Edge=", edge, element sumIdx = 0 if kernel["LocalSplitU"] > 1: - sumIdx = kw.startVgprValuC + vc0 + d1*kernel["VectorWidth"] + sumIdx = kw.startVgprValuC + vc0 + d1*kernel["VectorWidthA"] else: - bestVw = kernel["VectorWidth"] + bestVw = kernel["VectorWidthA"] elementsLoadedPerVw = kernel["NumThreads"] * bestVw elementsLoadedPerbestVw = kernel["NumThreads"] * kernel["StoreVectorWidth"] @@ -11658,60 +11667,6 @@ def emitAddressSetupCode(self, kernel, ss, tc, tmpVgpr, tmpS01, edge, beta, atom elif len(kernel["PackedC1IndicesX"]) > 1: kStr += self.kernelWriter.extractPackedCoord1ToRowStart(kernel, kernel["PackedC1IndicesX"] , self.coord1Vgpr, 'D') - # Shift Pointer for MFMA: - # For MFMA shift pointer, correct data is stored in another thread. - # Therefore, MFMA cannot use v_mov to amend store data - # It needs to modify the coord1 of thread directly. 
- if (not kernel["SourceSwap"]) and (not kernel["GuaranteeNoPartialB"]) and kw.readTileDimVectorB and kernel["EnableMatrixInstructionStore"] and edge and (tc =='C' or not beta): - (d1,d0,vc1,vc0) = self.element - if (d1 == vc1 == d0 == vc0 == 0) or self.newCoord1: - sgprCnt = self.kernelWriter.laneSGPRCount - waveSize = kernel["WavefrontSize"] - packedC1 = kernel["PackedC1IndicesX"] - strideC1 = "StrideC%s" % (kw.indexChars[packedC1[0]]) - strideD1 = "StrideD%s" % (kw.indexChars[packedC1[0]]) - - kStr += kw.comment("shift vector components d1") - vw = kernel["GlobalLoadVectorWidthB"] - vTmp1 = tmpVgpr - vTmp2 = tmpVgpr+1 - sTmp1 = tmpS01 - sTmp2 = tmpS01+sgprCnt - # check conditions - kStr += inst("v_bfi_b32", vgpr(vTmp1), vw-1, 0, vgpr(self.coord1Vgpr), "coord1 & ~(vw-1)") - kStr += inst("v_bfi_b32", vgpr(vTmp2), vw-1, 0, sgpr("SizesFree+%u"%kw.tPB["idx"]), "sizeFree & ~(vw-1)") - kStr += inst("v_cmp_eq_u32", sgpr(sTmp1,sgprCnt), vgpr(vTmp1), vgpr(vTmp2), "if coord1 is in edge glvw") - kStr += inst("v_and_b32", vgpr(vTmp2), sgpr("SizesFree+%u"%kw.tPB["idx"]), vw-1, "sizeFree mod VW") - kStr += inst("v_cmp_gt_u32", sgpr(sTmp2,sgprCnt), vgpr(vTmp2), 0, "this problem is not multiple size of glvw") - kStr += inst("s_and_b{}".format(waveSize), sgpr(sTmp1,sgprCnt), sgpr(sTmp1,sgprCnt), sgpr(sTmp2,sgprCnt), "AND both conditions") - # calculate new coord - kStr += inst("_v_add_u32", vgpr(vTmp1), vgpr(self.coord1Vgpr), vgpr(vTmp2), "shift coord1") - kStr += inst("v_bfi_b32", vgpr(vTmp1), vw-1, vgpr(vTmp1), sgpr("SizesFree+%u"%kw.tPB["idx"]), "new coord1 = (shift coord1 & (vw-1)) | (sizeFree & ~(vw-1))") - kStr += inst("_v_sub_i32", vgpr(vTmp2), vgpr(vTmp1), vgpr(self.coord1Vgpr), "shift how many column") - kStr += inst("v_cndmask_b32", vgpr(self.coord1Vgpr), vgpr(self.coord1Vgpr), vgpr(vTmp1), \ - sgpr(sTmp1,sgprCnt), "set new coord1 if meet conditions" ) - - if kernel["BufferStore"]: - kStr += inst("v_mad_i32_i24", vgpr(vTmp1), sgpr(strideC1), vgpr(vTmp2), 
vgpr(kw.cinRowPtr), \ - "new rowStart address += shift column * StridesC") - kStr += inst("v_cndmask_b32", vgpr(kw.cinRowPtr), vgpr(kw.cinRowPtr), vgpr(vTmp1), sgpr(sTmp1,sgprCnt), \ - "set new rowStart if meet conditions" ) - kStr += inst("v_mad_i32_i24", vgpr(vTmp1), sgpr(strideD1), vgpr(vTmp2), vgpr(kw.coutRowPtr), \ - "new rowStart address += shift column * StridesD") - kStr += inst("v_cndmask_b32", vgpr(kw.coutRowPtr), vgpr(kw.coutRowPtr), vgpr(vTmp1), sgpr(sTmp1,sgprCnt), \ - "set new rowStart if meet conditions" ) - - if kernel["StoreRemapVectorWidth"]: - ldsPad = max(kernel["StoreRemapVectorWidth"],kernel["MIOutputVectorWidth"]) - kStr += inst("v_mov_b32", vgpr(vTmp1), hex((kernel["MacroTile0"]+ldsPad)*kw.bpeCexternal), \ - "lds byte stride = (MT0 + PAD) * bpe") - kStr += inst("v_mad_i32_i24", vgpr(vTmp1), vgpr(vTmp1), vgpr(vTmp2), vgpr(kw.storeRemapLW), \ - "new lds write address += shift column * Lds byte Stride") - kStr += inst("v_cndmask_b32", vgpr(kw.storeRemapLW), vgpr(kw.storeRemapLW), vgpr(vTmp1), \ - sgpr(sTmp1,sgprCnt), "set new rowStart if meet conditions" ) - - kStr += "\n" - # calculate global load offset # this has to be done after calculating new coord1 if not kernel["BufferStore"] and (tc == 'D' or (tc == 'C' and beta)): @@ -11921,8 +11876,7 @@ def fixupBatch(self, kernel, ss, batchIdx, edge, gwvw, \ # allow expanding vgpr pool for OptNLL preventOverflow = True #(not isOptNLL) - ss.setupStoreElementsForBatch(kernel, gwvw, batchElements, batchElementSgprs, preventOverflow=preventOverflow, \ - VectorWidthB=self.VectorWidthB, isWorkspace=True) + ss.setupStoreElementsForBatch(kernel, gwvw, batchElements, batchElementSgprs, preventOverflow=preventOverflow, isWorkspace=True) loadsIssued = 0 storesIssued = 0 @@ -12893,8 +12847,7 @@ def partialsWriteBatch(self, kernel, ss, batchIdx, applyAlpha, beta, edge, atomi # allow expanding vgpr pool for OptNLL preventOverflow = (not isOptNLL) - ss.setupStoreElementsForBatch(kernel, gwvw, batchElements, 
batchElementSgprs, preventOverflow=preventOverflow, \ - VectorWidthB=self.VectorWidthB, isWorkspace=True) + ss.setupStoreElementsForBatch(kernel, gwvw, batchElements, batchElementSgprs, preventOverflow=preventOverflow, isWorkspace=True) storesIssued = 0 tmpS01 = tmpSgpr # scratch sgprs @@ -14017,8 +13970,7 @@ def globalWriteBatch(self, kernel, ss, batchIdx, applyAlpha, beta, edge, atomic, # allow expanding vgpr pool for OptNLL preventOverflow = (not isOptNLL) - ss.setupStoreElementsForBatch(kernel, gwvw, batchElements, batchElementSgprs, preventOverflow=preventOverflow, \ - VectorWidthB=self.VectorWidthB) + ss.setupStoreElementsForBatch(kernel, gwvw, batchElements, batchElementSgprs, preventOverflow=preventOverflow) loadsIssued = 0 storesIssued = 0 @@ -15402,9 +15354,9 @@ def initializeStoreCInUnrollAddrIncValues(self, kernel): totalTT0 = totalTT0 if kernel["SourceSwap"] else (totalTT0 * outputsPerThread) totalTT1 = (totalTT1 * outputsPerThread) if kernel["SourceSwap"] else totalTT1 - vectorWidth0 = kernel["VectorWidth"] if kernel["SourceSwap"] else kernel["MIOutputVectorWidth"] - MIOutputVectorWidthAdj = self.VectorWidthB * kernel["MIOutputVectorWidth"] - vectorWidth1 = MIOutputVectorWidthAdj if kernel["SourceSwap"] else 1 + vectorWidth0 = kernel["VectorWidthA"] if kernel["SourceSwap"] else kernel["VectorWidthA"] * kernel["MIOutputVectorWidth"] + vectorWidth1 = kernel["VectorWidthB"] * kernel["MIOutputVectorWidth"] if kernel["SourceSwap"] else kernel["VectorWidthB"] + # To here # Tile allocation patterns (MT=128x128 DGEMM SourceSwap) @@ -15504,7 +15456,7 @@ def initializeStoreCInUnrollAddrIncValues(self, kernel): self.StoreCInUnrollGprIncB2Iterations = self.StoreCInUnrollGprIncB1Iterations * self.StoreCInUnrollnumRows else: # need horizontal offset - self.StoreCInUnrollAddrIncHoffset = kernel["MIWaveGroup"][0] * kernel["VectorWidth"] * kernel["MatrixInstM"] * bpe + self.StoreCInUnrollAddrIncHoffset = kernel["MIWaveGroup"][0] * vectorWidth0 * kernel["MatrixInstM"] 
* bpe if self.StoreCInUnrollNumInterleaveV == 1: # case 2-1: self.StoreCInUnrollAddrIncV1Iterations = self.StoreCInUnrollNumHorizontalTiles @@ -15594,7 +15546,7 @@ def generateInitialCorDaddrIncrement(self, kernel, CorD): # get StoreC loop iteration times ############################################################################## def getStoreCLoopIterTimes(self, kernel): - StoreCLoopIterTimes = kernel["ThreadTile0"]*kernel["ThreadTile1"] // kernel["VectorWidth"] # 128x128 case, 32 times. 128x64 case, 16 times for double + StoreCLoopIterTimes = kernel["ThreadTile0"]*kernel["ThreadTile1"] // kernel["VectorWidthA"] # 128x128 case, 32 times. 128x64 case, 16 times for double return StoreCLoopIterTimes ############################################################################## @@ -16324,9 +16276,9 @@ def AccToArchMapper(self, kernel): matrixInstBN = 1 if (kernel["MatrixInstN"] == 4) else kernel["MatrixInstBN"] OutputsPerMFMA1B = matrixInstM * matrixInstN // self.kernel["WavefrontSize"] - VectorWidth0 = kernel["VectorWidth"] if kernel["SourceSwap"] else 1 + VectorWidth0 = kernel["VectorWidthA"] outerTT0 = kernel["MIWaveTile"][0] // VectorWidth0 - VectorWidth1 = self.VectorWidthB + VectorWidth1 = kernel["VectorWidthB"] outerTT1 = kernel["MIWaveTile"][1] // VectorWidth1 for wgIdx1 in range(0, outerTT1): @@ -16440,7 +16392,7 @@ def getAccVgprInc1(self,kernel,frequency=1): inc = 0 numReg = self.StoreCInUnrollNumReg numRows = self.StoreCInUnrollnumRows - numReg1Block = numReg * numRows * kernel["VectorWidth"] + numReg1Block = numReg * numRows * kernel["VectorWidthA"] if self.StoreCInUnrollNumHorizontalTiles == 1: if self.StoreCInUnrollNumInterleaveV == 1: # no line interleave case @@ -16462,7 +16414,7 @@ def getAccVgprInc1(self,kernel,frequency=1): def getAccVgprOffsetB1(self,kernel): numReg = self.StoreCInUnrollNumReg numRows = self.StoreCInUnrollnumRows - numReg1Block = numReg * numRows * kernel["VectorWidth"] + numReg1Block = numReg * numRows * kernel["VectorWidthA"] 
if self.StoreCInUnrollNumHorizontalTiles == 1 and self.StoreCInUnrollNumInterleaveV == 1: offsetV1 = numReg1Block elif self.StoreCInUnrollNumHorizontalTiles > 1 and self.StoreCInUnrollNumInterleaveV > 1: @@ -16480,7 +16432,7 @@ def getAccVgprOffsetB2(self,kernel): if self.StoreCInUnrollNumHorizontalTiles > 1 and self.StoreCInUnrollNumInterleaveV > 1: inc = numReg else: - inc = numReg * kernel["VectorWidth"] * B2Iterations + inc = numReg * kernel["VectorWidthA"] * B2Iterations return inc ############################################################################## @@ -16489,7 +16441,7 @@ def getAccVgprOffsetB2(self,kernel): def getAccVgprOffsetB3(self,kernel): numReg = self.StoreCInUnrollNumReg B3Iterations = self.StoreCInUnrollGprIncB3Iterations - inc = numReg * kernel["VectorWidth"] * B3Iterations + inc = numReg * kernel["VectorWidthA"] * B3Iterations return inc ############################################################################## diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index 7ac9885cd..03dfc1ca4 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2016-2023 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2016-2024 Advanced Micro Devices, Inc. All rights reserved. 
# # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -2497,9 +2497,9 @@ def isDirectToVgprDoable(state, tc): %(tc, tc, state["NumLoadsCoalesced%c"%tc], MIindex, state['MIWaveTile'][MIindex], tc, state["GlobalLoadVectorWidth%c"%tc])) return False # Does not work with MIWaveTile < VectorWidth - if state['MIWaveTile'][MIindex] < state["VectorWidth"]: - reject(state, "DirectToVgpr%c does not supports MIWaveTile[%u](=%u) < VectorWidth(=%u)"\ - %(tc, MIindex, state['MIWaveTile'][MIindex], state["VectorWidth"])) + if state['MIWaveTile'][MIindex] < state["VectorWidth%s"%tc]: + reject(state, "DirectToVgpr%c does not supports MIWaveTile[%u](=%u) < VectorWidth%s(=%u)"\ + %(tc, MIindex, state['MIWaveTile'][MIindex], tc, state["VectorWidth%s"%tc])) return False # Does not work with ExpandPointerSwap = False @@ -2508,8 +2508,8 @@ def isDirectToVgprDoable(state, tc): return False # Does not work with TLU + VectorWidth != GlobalLoadVectorWidth (VW = 2 + GRVW = 1 or VW = 1 + GRVW = 2 does not work) - if state["ProblemType"]["TLU%c"%tc] and state["VectorWidth"] != state["GlobalLoadVectorWidth%c"%tc]: - reject(state, "DirectToVgpr%c does not supports TLU + VectorWidth(=%u) != GlobalLoadVectorWidth%c(%u)"%(tc, state["VectorWidth"], tc, state["GlobalLoadVectorWidth%c"%tc])) + if state["ProblemType"]["TLU%c"%tc] and state["VectorWidth%s"%tc] != state["GlobalLoadVectorWidth%c"%tc]: + reject(state, "DirectToVgpr%c does not supports TLU + VectorWidth%s(=%u) != GlobalLoadVectorWidth%c(%u)"%(tc, tc, state["VectorWidth%s"%tc], tc, state["GlobalLoadVectorWidth%c"%tc])) return False # Does not work with FractionalLoad and (not TLU) @@ -2530,8 +2530,8 @@ def isDirectToVgprDoable(state, tc): return False # Does not work with TLU=False and PrefetchLocalRead=1 and VectorWidth>1 - if (not state["ProblemType"]["TLU%c"%tc]) and state["PrefetchLocalRead"] == 1 and state["VectorWidth"] > 1: - 
reject(state, "DirectToVgpr%c does not supports TLU=False and PrefetchLocalRead=1 and VectorWidth>1)"%(tc)) + if (not state["ProblemType"]["TLU%c"%tc]) and state["PrefetchLocalRead"] == 1 and state["VectorWidth%s"%tc] > 1: + reject(state, "DirectToVgpr%c does not supports TLU=False and PrefetchLocalRead=1 and VectorWidth%s>1)"%(tc, tc)) return False # Does not work with SIA<3 and PGR=2 @@ -2539,11 +2539,6 @@ def isDirectToVgprDoable(state, tc): reject(state, "DirectToVgpr%c does not supports ScheduleIterAlg < 3 and PrefetchGlobalRead==2"%(tc)) return False - # Does not work with DirectToVgprB + SourceSwap=False + VectorWidth>1 - if tc == 'B' and (not state["SourceSwap"]) and state["VectorWidth"]>1: - reject(state, "DirectToVgpr%c does not supports SourceSwap=False and VectorWidth>1"%(tc)) - return False - # Does not work with InnerUnroll>1 if state["InnerUnroll"]>1: reject(state, "DirectToVgpr%c does not supports InnerUnroll>1"%(tc)) @@ -2696,8 +2691,8 @@ def isDirectToLdsDoable(state, tc): reject(state, "ThreadSeparateGlobalRead%c does not work with DTL%c + TLU%c"%(tc, tc, tc)) if state["NumLoadsCoalesced%c"%tc] > 1: reject(state, "ThreadSeparateGlobalRead%c does not work with DirectToLds + NumLoadsCoalesced > 1."%(tc)) - if int(state["WavefrontSize"] * state["GlobalLoadVectorWidth%c"%tc]) < state["_DepthULds"] * state["VectorWidth"]: - reject(state, "ThreadSeparateGlobalRead%c does not work with WavefrontSize * GlobalLoadVectorWidth%c < _DepthULds * VectorWidth."%(tc, tc)) + if int(state["WavefrontSize"] * state["GlobalLoadVectorWidth%c"%tc]) < state["_DepthULds"] * state["VectorWidth%s"%tc]: + reject(state, "ThreadSeparateGlobalRead%c does not work with WavefrontSize * GlobalLoadVectorWidth%c < _DepthULds * VectorWidth%s."%(tc, tc, tc)) # Does not work with LocalSplitU if state["LocalSplitU"] > 1: @@ -2768,6 +2763,7 @@ def ldsPaddingAuto(state, isa): idx01 = 0 if tc == 'A' else 1 charMN = 'M' if tc == 'A' else 'N' numBank = 32 + vw = state["VectorWidth%s"%tc] # 
LdsBlockSizePerPad and LdsPad setting autoCalcLBSPP = False @@ -2781,7 +2777,7 @@ def ldsPaddingAuto(state, isa): if state["ProblemType"]["TLU%s"%tc] and (not state["UnrollMajorLDS%s"%tc]): state["LdsPad%s"%tc] = 0 else: - state["LdsPad%s"%tc] = state["VectorWidth"] + state["LdsPad%s"%tc] = vw autoAdjusted["LdsPad%s"%tc] = autoCalcLBSPP if state["EnableMatrixInstruction"]: @@ -2790,21 +2786,19 @@ def ldsPaddingAuto(state, isa): LRstride = 0 comment = "" depthU = state["_DepthULds"] - vw = state["VectorWidth"] if tc=='A' else state["VectorWidthB"] - if not state["SourceSwap"]: - vw = 1 # TODO: support non-SourceSwap + vw if state["UnrollMajorLDS%s"%tc]: - LRstrideLine = state["_DepthULds"] + LRstrideLine = depthU comment = "DepthULds" - # if depthU is not power of 2, adjust ldsPad at each line (keep LRstride = 0) - if not (depthU > 0 and (depthU & (depthU - 1)) != 0): - LRstride = LRstrideLine * vw + LRstride = LRstrideLine * vw else: LRstrideLine = state["MacroTile%d"%idx01] comment = "MT0" if state["MIInputPerThread"] > 1: # MIInputPerThread > 1 case, we still need padding to mitigate bank conflict even for non-UnrollMajorLDS case LRstride = LRstrideLine * state["LocalReadVectorWidth"] + # if LRstrideLine is not power of 2, adjust ldsPad at each line (keep LRstride = 0) + if LRstrideLine <= 0 or (LRstrideLine & (LRstrideLine - 1)) != 0: + LRstride = 0 # auto calc for LBSPP if autoCalcLBSPP and LRstride > 0: state["LdsBlockSizePerPad%s"%tc] = max(int(2**(math.ceil(math.log(LRstride * numBytes, 2)))), 128) @@ -3240,30 +3234,82 @@ def assignDerivedParameters(state): #print "staggerStrideShift=", staggerStrideShift, "depthu=", state["DepthU"] state["_staggerStrideShift"] = staggerStrideShift - # VectorWidth default handling - if state["VectorWidth"] < 1: - if state["EnableMatrixInstruction"]: + # Use GlobalReadVectorWidth if it is not -1 + if state["GlobalReadVectorWidth"] != -1: + state["GlobalLoadVectorWidthA"] = state["GlobalReadVectorWidth"] + 
state["GlobalLoadVectorWidthB"] = state["GlobalReadVectorWidth"] + + if state["EnableMatrixInstruction"]: + # MI case + # VectorWidth default handling + if state["VectorWidth"] < 1: regPerElem = state["ProblemType"]["DataType"].numRegisters() # half: regPE=0.5, vw=2 / int8: regPE=0.25, vw=4 state["VectorWidth"] = int(1//regPerElem) if (regPerElem < 1) else 1 - else: + + if state["VectorWidthB"] < 1: + regPerElem = state["ProblemType"]["DataType"].numRegisters() + # half: regPE=0.5, vw=2 / int8: regPE=0.25, vw=4 + state["VectorWidthB"] = int(1//regPerElem) if (regPerElem < 1) else 1 + # state["VectorWidthB"] = 1 # use 1 to avoid existing kernels getting rejected (backward compatibility) + # DirectToVgpr special case + # allow LocalReadVectorWidthB > 1 for TLUB + MatrixInstruction (this is applicable for B only) + # some more limitations necessary to make this logic work + # - MatrixInstruction + # - TLUB and not UnrollMajorLDSB + # - MIInputPerThread == 1 + # - SourceSwap + # - DirectToVgprB or DirectToVgprA + # - MIWaveTile1 must be multiple of VectorWidthB + # need state["LocalReadVectorWidth"] != -1 for DTVA + # need state["GlobalLoadVectorWidthB"] != -1 for DTVB + if state["EnableMatrixInstruction"] and \ + state["ProblemType"]["TLUB"] and (not state["UnrollMajorLDSB"]) and \ + state["MIInputPerThread"] == 1 and state["SourceSwap"]: + if state["DirectToVgprB"] and state["GlobalLoadVectorWidthB"] != -1: + state["VectorWidthB"] = state["GlobalLoadVectorWidthB"] + elif state["DirectToVgprA"] and state["ProblemType"]["TLUA"] and state["LocalReadVectorWidth"] != -1: + state["VectorWidthB"] = state["LocalReadVectorWidth"] + + # TT0,1 both must be multiples of VW, b/c of rC, rA, rB + if ((state["MIWaveTile"][0] % state["VectorWidth"]) != 0): + if not state["SourceSwap"]: + # non SourceSwap case, change VectorWidth to 1 for backward compatibility (before SourceSwap + VectorWidth support) + state["VectorWidth"] = 1 + else: + reject(state, "MIWaveTile0(%u) should be 
multiple of VectorWidth(%u)" % (state["MIWaveTile"][0], state["VectorWidth"])) + return + if (state["MIWaveTile"][1] % state["VectorWidthB"]) != 0: + #reject(state, "MIWaveTile1(%u) should be multiple of VectorWidthB(%u)" % (state["MIWaveTile"][1], state["VectorWidthB"])) + #return + # change VectorWidthB to 1 for backward compatibility (before VectorWidthB support) + state["VectorWidthB"] = 1 + if state["StoreRemapVectorWidth"]: + # change VectorWidth and VectorWidthB to 1 for backward compatibility (before SourceSwap + VectorWidth support) + state["VectorWidth"] = 1 + state["VectorWidthB"] = 1 + + else: + # non MI case + # VectorWidth default handling + if state["VectorWidth"] < 1: state["VectorWidth"] = int(4 / state["ProblemType"]["DataType"].numRegisters()) while state["ThreadTile0"] % state["VectorWidth"] != 0 \ or state["ThreadTile1"] % state["VectorWidth"] != 0: state["VectorWidth"] //= 2 - # TT0,1 both must be multiples of VW, b/c of rC, rA, rB - if state["EnableMatrixInstruction"]: - if state["SourceSwap"] and ((state["MIWaveTile"][0] % state["VectorWidth"]) != 0): - reject(state, "MIWaveTile0(%u) should be multiple of VectorWidth(%u)" % (state["MIWaveTile"][0], state["VectorWidth"])) - return - else: + # TT0,1 both must be multiples of VW, b/c of rC, rA, rB if state["ThreadTile0"] % state["VectorWidth"] != 0 \ or state["ThreadTile1"] % state["VectorWidth"] != 0: reject(state, "ThreadTile0 %u or ThreadTile1 %u not a multiple of VectorWidth %u" \ % (state["ThreadTile0"], state["ThreadTile1"], \ state["VectorWidth"])) return + # use VectorWidthB=VectorWidth for non MI case + state["VectorWidthB"] = state["VectorWidth"] + + # use VectorWidthA internally + state["VectorWidthA"] = state["VectorWidth"] if len(problemType["IndicesSummation"]) > 1: # not supported with multiple summations, bug is maybe something with @@ -3291,15 +3337,14 @@ def assignDerivedParameters(state): #if state["KernelLanguage"] == "Assembly" and state["PackSummationDims"]: # 
reject(state, "PackSummationDims does not yet support assembly") - # Use GlobalReadVectorWidth if it is not -1 - if state["GlobalReadVectorWidth"] != -1: - state["GlobalLoadVectorWidthA"] = state["GlobalReadVectorWidth"] - state["GlobalLoadVectorWidthB"] = state["GlobalReadVectorWidth"] - # Default GlobalLoadVectorWidthA, B for tc in ('A','B'): if state["GlobalLoadVectorWidth%s"%tc] == -1: state["GlobalLoadVectorWidth%s"%tc] = state["VectorWidth"] + if state["KernelLanguage"] == "Assembly": + # asm kernel case, GlobalLoadVectorWidth needs to be at least numElemPerReg + numElemPerReg = int(math.ceil(1 / state["ProblemType"]["DataType"].numRegisters())) + state["GlobalLoadVectorWidth%s"%tc] = max(state["VectorWidth"], numElemPerReg) # reject - GLVWA/B too big if (state["GlobalLoadVectorWidth%s"%tc] * state["ProblemType"]["DataType"].numBytes()) > 16: reject(state, "GlobalLoadVectorWidth%s * DataType.numBytes() > 16"%tc) @@ -3319,8 +3364,8 @@ def assignDerivedParameters(state): if state["EnableMatrixInstruction"]: if state["SourceSwap"]: - if ((state["VectorWidth"] % state["StoreVectorWidth"]) != 0): - reject(state, "MFMA SourceSwap mode doesn't support vw(%u) with svw(%u)" % (state["VectorWidth"], state["StoreVectorWidth"])) + if ((state["VectorWidthA"] % state["StoreVectorWidth"]) != 0): + reject(state, "MFMA SourceSwap mode doesn't support vw(%u) with svw(%u)" % (state["VectorWidthA"], state["StoreVectorWidth"])) return else: if ((state["MIOutputVectorWidth"] % state["StoreVectorWidth"]) != 0): @@ -3328,8 +3373,11 @@ def assignDerivedParameters(state): return # reject - VW too big - if (state["VectorWidth"] * state["ProblemType"]["DataType"].numBytes()) > 16: - reject(state, "VW * DataType.numBytes() > 16") + if (state["VectorWidthA"] * state["ProblemType"]["DataType"].numBytes()) > 16: + reject(state, "VWA * DataType.numBytes() > 16") + return + if (state["VectorWidthB"] * state["ProblemType"]["DataType"].numBytes()) > 16: + reject(state, "VWB * 
DataType.numBytes() > 16") return # LocalSplitU too large? @@ -3341,7 +3389,7 @@ def assignDerivedParameters(state): return state["NumElementsPerThread"] = numElementsPerWorkGroup // state["NumThreads"] - state["GlobalWriteVectorWidth"] = min(state["VectorWidth"], state["NumElementsPerThread"] ) + state["GlobalWriteVectorWidth"] = min(state["VectorWidthA"], state["NumElementsPerThread"] ) if state["NumElementsPerThread"] % state["GlobalWriteVectorWidth"] != 0: reject(state, "LSU NumElementsPerThread %u not divisible into GWVW %u" \ % (state["NumElementsPerThread"], state["GlobalWriteVectorWidth"])) @@ -3553,10 +3601,7 @@ def assignDerivedParameters(state): validDepthU = False else: GlobalLoadVectorWidthA = GlobalLoadVectorWidthAorig - if state["DirectToVgprA"]: - if not state["SourceSwap"]: - GlobalLoadVectorWidthA = 1 # adjust GlobalLoadVectorWidth to 1 in DirectToVgpr case (except for DirectToVgprA + SourceSwap) - elif state["DirectToLdsA"] and (bpeAB * GlobalLoadVectorWidthA) > 4: + if state["DirectToLdsA"] and (bpeAB * GlobalLoadVectorWidthA) > 4: # bpe * grvw must be <= 4 for DirectToLds (lds flag only for <= 32bit load) GlobalLoadVectorWidthA = 4 / bpeAB # use float only for <1. 
Otherwise, convert to int @@ -3788,31 +3833,22 @@ def assignDerivedParameters(state): # - TLUB and not UnrollMajorLDSB # - MIInputPerThread == 1 # - SourceSwap - # - DirectToVgprB or DirectToVgprA - # - MIWaveTile1 must be multiple of VectorWidthB + # - DirectToVgprA # need to check after state["LocalReadVectorWidth"] = -1 is resolved - VectorWidthB = 1 + wideLRVWBforTLUBallowed = False if state["EnableMatrixInstruction"] and \ state["ProblemType"]["TLUB"] and (not state["UnrollMajorLDSB"]) and \ state["MIInputPerThread"] == 1 and state["SourceSwap"]: - if state["DirectToVgprB"]: - VectorWidthB = state["GlobalLoadVectorWidthB"] - if state["MIWaveTile"][1] % VectorWidthB != 0: - reject(state, "DirectToVgprB does not support MIWaveTile1 is not multiple of GlobalLoadVectorWidthB") - elif state["DirectToVgprA"] and state["ProblemType"]["TLUA"]: - VectorWidthB = state["LocalReadVectorWidth"] - if state["MIWaveTile"][1] % VectorWidthB != 0: - # cannot use wider local read - reject(state, "DirectToVgprA does not support MIWaveTile1 is not multiple of LocalReadVectorWidth") - - state["VectorWidthB"] = VectorWidthB + if state["DirectToVgprA"] and state["ProblemType"]["TLUA"] and state["VectorWidthB"] == state["LocalReadVectorWidth"]: + wideLRVWBforTLUBallowed = True + # LocalReadVectorWidth check if state["EnableMatrixInstruction"]: if state["LocalReadVectorWidth"] < state["MIInputPerThread"]: reject(state, "LocalReadVectorWidth < %u" %(state["MIInputPerThread"])) if state["LocalReadVectorWidth"] > state["MIInputPerThread"] and not (state["UnrollMajorLDSA"] or state["UnrollMajorLDSB"]) \ - and not (state["DirectToVgprA"] and state["LocalReadVectorWidth"] == VectorWidthB): + and not (state["DirectToVgprA"] and state["LocalReadVectorWidth"] == state["VectorWidthB"] and wideLRVWBforTLUBallowed): reject(state, "LocalReadVectorWidth require Transpose LDS") if state["LocalReadVectorWidth"] > state["MIInputPerThread"] and \ (state["UnrollMajorLDSA"] and (not 
state["UnrollMajorLDSB"])) and \ @@ -4212,7 +4248,7 @@ def assignDerivedParameters(state): if state["PrefetchAcrossPersistentMode"] == 0: reject(state, "StoreCInUnroll requires PrefetchAcrossPersistentMode") return - if state["ProblemType"]["DataType"].isDouble() and state["VectorWidth"] != 2: + if state["ProblemType"]["DataType"].isDouble() and state["VectorWidthA"] != 2: reject(state, "StoreCInUnroll requires VectorWidth=2 for dgemm") return if state["AtomicAddC"] and state["StoreVectorWidth"] != 1: @@ -4245,6 +4281,9 @@ def assignDerivedParameters(state): if not state["BufferStore"]: reject(state, "StoreCInUnroll requires BufferStore feature") return + if state["VectorWidthB"] > 1: + reject(state, "StoreCInUnroll + VectorWidthB > 1 not supported yet") + return # minimum K check # PGR=2 requires minimum K @@ -4259,7 +4298,7 @@ def assignDerivedParameters(state): # StoreCInUnrollExact requires exact K if state["StoreCInUnrollExact"]: # K == DepthU * ThreadTile0 * ThreadTile1 // VectorWidth is necessary - exactK = state["DepthU"] * state["ThreadTile0"] * state["ThreadTile1"] // state["VectorWidth"] + exactK = state["DepthU"] * state["ThreadTile0"] * state["ThreadTile1"] // state["VectorWidthA"] if not (3 in state["AssertSizeEqual"].keys() and state["AssertSizeEqual"][3] == exactK): reject(state, "StoreCInUnrollExact does not work if AssertSizeEqual for K is not DepthU * ThreadTile0 * ThreadTile1 / VectorWidth") return @@ -4545,13 +4584,6 @@ def assignDerivedParameters(state): (state["ThreadTile0"] == 4 and state["ThreadTile1"] == 8)): reject(state, "UnrollLoopEfficiencyEnable does not support ThreadTile0,1 = [%u,%u]"%(state["ThreadTile0"], state["ThreadTile1"])) - # reject check for ClusterLocalRead - if state["ClusterLocalRead"]: - # Requires VgprForLocalReadPacking - if not state["VgprForLocalReadPacking"]: - reject(state, "ClusterLocalRead works with VgprForLocalReadPacking") - return - # reject check for VgprForLocalReadPacking if 
state["VgprForLocalReadPacking"]: # MatrixInstruction only @@ -4571,6 +4603,17 @@ def assignDerivedParameters(state): reject(state, "VgprForLocalReadPacking is effective only fof 1 or 2 byte input + UnrollMajorLDSA or B =false") return + # reject check for ClusterLocalRead + if state["ClusterLocalRead"]: + # Requires VgprForLocalReadPacking + if not state["VgprForLocalReadPacking"]: + reject(state, "ClusterLocalRead works with VgprForLocalReadPacking") + return + if (state["UnrollMajorLDSA"] == False and state["VectorWidthA"] > state["MIInputPerThread"]) or\ + (state["UnrollMajorLDSB"] == False and state["VectorWidthB"] > state["MIInputPerThread"]): + reject(state, "ClusterLocalRead does not support VectorWidth or VectorWidthB > MIInputPerThread") + return + ######################################## # create a dictionary with booleans on whether to include parameter in name @staticmethod diff --git a/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma.yaml b/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma.yaml index 5f14e5397..724b5fbfe 100644 --- a/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma.yaml +++ b/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma.yaml @@ -241,3 +241,55 @@ BenchmarkProblems: - ProblemSizes: - Exact: [ 252, 252, 1, 2050] + ######################################## + # HSS NT - LSU + VWB + VFLRP + CLR + ######################################## + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - MatrixInstruction: + - [16, 16, 16, 1, 1, 4, 4, 2,1] # 128x64 + - [16, 16, 16, 1, 1, 4, 4, 2,2] # 128x128 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + - [ 64, 1, 1 ] # only WG2 is effective for 9 parameter MI + - [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI + - AssertFree0ElementMultiple : [4]#[1,2,4] + - AssertFree1ElementMultiple : [4]#[1,2,4] + - 
AssertSummationElementMultiple: [2] + - DepthU: [32,64]#[8,16,32] + #- GlobalSplitU: [1,4] + #- GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - 1LDSBuffer: [0] + - LoopTail: [True] + - OptNoLoadLoop: [1] + - PrefetchGlobalRead: [2] + - PrefetchLocalRead: [3,5]#[1,3,5,9] + - ScheduleIterAlg: [3] + - StaggerU: [0] + - SourceSwap: [0,1] + #- TransposeLDS: [0,1] + - GlobalReadVectorWidth: [4] + - VectorWidth: [2,4] + - VectorWidthB: [1,2,4] + #- VectorAtomicWidth: [-1,1,2] + #- WaveSeparateGlobalReadB: [1] + #- MIArchVgpr: [True, False] + - NumElementsPerBatchStore: [0] + #- UseSgprForGRO: [0] + #- BufferLoad: [0,1] + #- BufferStore: [0,1] + #- GlobalSplitUAtomicAdd: [0,1] + - VgprForLocalReadPacking: [0,1] + - ClusterLocalRead: [0,1] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Exact: [ 252, 252, 1, 2050] + diff --git a/Tensile/Tests/extended/local_split_u/igemm_lsu_mfma.yaml b/Tensile/Tests/extended/local_split_u/igemm_lsu_mfma.yaml index e1b715732..fcf44d03d 100644 --- a/Tensile/Tests/extended/local_split_u/igemm_lsu_mfma.yaml +++ b/Tensile/Tests/extended/local_split_u/igemm_lsu_mfma.yaml @@ -80,6 +80,57 @@ BenchmarkProblems: - ProblemSizes: - Exact: [ 252, 254, 1, 2050] + ######################################## + # I8II NT - LSU + VFLRP + VWB + ######################################## + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - MatrixInstruction: + - [16, 16, 16, 1, 1, 8, 8, 2,1] # 256x128 + - [16, 16, 16, 1, 1, 8, 8, 2,2] # 256x256 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + - [ 64, 1, 1 ] # only WG2 is effective for 9 parameter MI + - [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI + - AssertFree0ElementMultiple : [4] + - AssertFree1ElementMultiple : [4] + - AssertSummationElementMultiple: [4] + - DepthU: [32,64]#[8,16,32] + 
#- GlobalSplitU: [1,4] + #- GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - 1LDSBuffer: [0] + - LoopTail: [True] + - OptNoLoadLoop: [1] + - PrefetchGlobalRead: [2] + - PrefetchLocalRead: [1,3,5] + - ScheduleIterAlg: [3] + - StaggerU: [0] + - SourceSwap: [0,1] + #- TransposeLDS: [0,1] + - GlobalReadVectorWidth: [4,8,16] + - VectorWidth: [2,4,8] + - VectorWidthB: [1,2,4,8] + #- VectorAtomicWidth: [-1,1,2] + #- WaveSeparateGlobalReadB: [1] + #- MIArchVgpr: [True, False] + - NumElementsPerBatchStore: [4] + - UseSgprForGRO: [0] + #- BufferLoad: [0,1] + #- BufferStore: [0,1] + - VgprForLocalReadPacking: [0,1] + - ClusterLocalRead: [0,1] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Exact: [ 252, 252, 1, 2052] + ######################################## # I8II NT - LSU + GSU + MIB>1 ######################################## diff --git a/Tensile/Tests/extended/local_split_u/sgemm_lsu_mfma.yaml b/Tensile/Tests/extended/local_split_u/sgemm_lsu_mfma.yaml index 72cf67ed8..3a0fc9e25 100644 --- a/Tensile/Tests/extended/local_split_u/sgemm_lsu_mfma.yaml +++ b/Tensile/Tests/extended/local_split_u/sgemm_lsu_mfma.yaml @@ -240,6 +240,59 @@ BenchmarkProblems: - ProblemSizes: - Exact: [1020, 1020, 1, 2052] + ######################################## + # NT - LSU + VWB + ######################################## + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - MatrixInstruction: + - [16, 16, 4, 1, 1, 4,4, 2,1] # 128x64 + - [16, 16, 4, 1, 1, 4,4, 1,2] # 64x128 + - [16, 16, 4, 1, 1, 4,4, 2,2] # 128x128 + - [16, 16, 4, 1, 1, 4,4, 4,1] # 256x64 + - [16, 16, 4, 1, 1, 4,4, 1,4] # 64x256 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + - [ 64, 1, 1 ] # only WG2 is effective for 9 parameter MI + - [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI + - DepthU: [16] + #- 
GlobalSplitU: [1,2] + #- GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + #- GlobalSplitUWorkGroupMappingRoundRobin: [False] + #- GlobalSplitUSummationAssignmentRoundRobin: [True] + - 1LDSBuffer: [0] + #- AssertFree0ElementMultiple : [8] + - AssertFree1ElementMultiple : [4]#[1,4] + - ExpandPointerSwap: [1] # 1 for DirectToVgpr + - PrefetchGlobalRead: [1] # should be 1 for DTVA+DTVB + - PrefetchLocalRead: [1] + - SuppressNoLoadLoop: [0] + - ScheduleLocalWrite: [1] + - ScheduleGlobalRead: [1] + - ScheduleIterAlg: [3]#[0] + - StaggerU: [0] + - SourceSwap: [0,1] + #- TransposeLDS: [1] + - GlobalReadVectorWidth: [1,2,4] + - VectorWidth: [1,2,4] + - VectorWidthB: [1,2,4] + - LocalReadVectorWidth: [1,2,4] + - DirectToVgprA: [True, False] + - DirectToVgprB: [True, False] + #- MIArchVgpr: [False, True] + - NumElementsPerBatchStore: [2] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Exact: [1020, 1020, 1, 2052] + ######################################## # TT - standard ######################################## From a700951dddd668b9b4423f2482b5e5098c262c54 Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Fri, 12 Jan 2024 11:14:21 -0700 Subject: [PATCH 31/51] Update xfail, 1sum tests only failing on gfx90a (#1866) --- Tensile/Tests/extended/multi_sum_psd/1sum_gsu_simple.yaml | 2 +- Tensile/Tests/extended/multi_sum_psd/1sum_simple.yaml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Tensile/Tests/extended/multi_sum_psd/1sum_gsu_simple.yaml b/Tensile/Tests/extended/multi_sum_psd/1sum_gsu_simple.yaml index def472522..fb89bd28e 100644 --- a/Tensile/Tests/extended/multi_sum_psd/1sum_gsu_simple.yaml +++ b/Tensile/Tests/extended/multi_sum_psd/1sum_gsu_simple.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [xfail] + marks: [xfail-gfx90a] GlobalParameters: EnqueuesPerSync: 1 diff --git a/Tensile/Tests/extended/multi_sum_psd/1sum_simple.yaml b/Tensile/Tests/extended/multi_sum_psd/1sum_simple.yaml index fa615a065..e135af53e 100644 
--- a/Tensile/Tests/extended/multi_sum_psd/1sum_simple.yaml +++ b/Tensile/Tests/extended/multi_sum_psd/1sum_simple.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [xfail] + marks: [xfail-gfx90a] GlobalParameters: EnqueuesPerSync: 1 From de6fc55839731956f756f8a5848600eea1a38e09 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Sat, 13 Jan 2024 11:22:08 +0900 Subject: [PATCH 32/51] enable VgprForLocalReadPacking + PrefetchLocalRead=1 (#1864) - removed the reject condition for VFLRP + PLR=1 - added test cases for VFLRP + PLR=1 --- Tensile/SolutionStructs.py | 6 +++--- Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml | 5 +++-- Tensile/Tests/extended/direct_to_vgpr/dtv_igemm.yaml | 4 ++-- 3 files changed, 8 insertions(+), 7 deletions(-) diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index 03dfc1ca4..5f94cfa9f 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -4594,9 +4594,9 @@ def assignDerivedParameters(state): if not globalParameters["ArchCaps"][globalParameters["CurrentISA"]]["HasEccHalf"]: reject(state, "VgprForLocalReadPacking is for EccHalf only") return - # only for SIA=3 + PLR>1 - if not (state["ScheduleIterAlg"] == 3 and state["PrefetchLocalRead"] > 1): - reject(state, "VgprForLocalReadPacking is effective only fof SIA=3 and PLR>1") + # only for SIA=3 + PLR>=1 + if not (state["ScheduleIterAlg"] == 3 and state["PrefetchLocalRead"] >= 1): + reject(state, "VgprForLocalReadPacking is effective only fof SIA=3 and PLR>=1") return # only for 1 or 2 byte input (numRegister < 1) + UnrollMajorLDSA or B is False if not (state["ProblemType"]["DataType"].numRegisters() < 1 and (state["UnrollMajorLDSA"] == False or state["UnrollMajorLDSB"] == False)): diff --git a/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml b/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml index 1c1212fc2..b237842a3 100644 --- a/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml +++ 
b/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml @@ -217,7 +217,7 @@ BenchmarkProblems: - DepthU: [32,64] - 1LDSBuffer: [0] - PrefetchGlobalRead: [1]#[1,2] - - PrefetchLocalRead: [2,3,5,9] + - PrefetchLocalRead: [1,2,3,5,9] - ScheduleIterAlg: [3] #- StaggerU: [0,32] - SourceSwap: [1]#[0,1] @@ -225,6 +225,7 @@ BenchmarkProblems: - GlobalReadVectorWidth: [2,4,8] - LocalReadVectorWidth: [2,4,8] - VectorWidth: [1,2] + - VectorWidthB: [1,2] #- WaveSeparateGlobalReadB: [1] - NumElementsPerBatchStore: [4] - UseSgprForGRO: [0] @@ -232,7 +233,7 @@ BenchmarkProblems: - DirectToLdsA: [False, True] - DirectToLdsB: [False, True] - NumLoadsCoalescedA: [1] - - BufferLoad: [0,1] + #- BufferLoad: [0,1] - GlobalSplitU: [1,2] - GlobalSplitUAlgorithm: ["SingleBuffer"] - VgprForLocalReadPacking: [1] diff --git a/Tensile/Tests/extended/direct_to_vgpr/dtv_igemm.yaml b/Tensile/Tests/extended/direct_to_vgpr/dtv_igemm.yaml index a37995b89..b8d26d029 100644 --- a/Tensile/Tests/extended/direct_to_vgpr/dtv_igemm.yaml +++ b/Tensile/Tests/extended/direct_to_vgpr/dtv_igemm.yaml @@ -325,7 +325,7 @@ BenchmarkProblems: - DepthU: [32,64] - 1LDSBuffer: [0] - PrefetchGlobalRead: [1]#[1,2] - - PrefetchLocalRead: [2,3,5,9] + - PrefetchLocalRead: [1,2,3,5,9] - ScheduleIterAlg: [3] - StaggerU: [0,32] - SourceSwap: [1]#[0,1] @@ -663,7 +663,7 @@ BenchmarkProblems: - DepthU: [32,64] - 1LDSBuffer: [0] - PrefetchGlobalRead: [1]#[1,2] - - PrefetchLocalRead: [2,3,5,9] + - PrefetchLocalRead: [1,2,3,5,9] - ScheduleIterAlg: [3] #- StaggerU: [0,32] - SourceSwap: [1]#[0,1] From ddb1e9a26b79f5f3e0ff79b09dbadc65c2d5a381 Mon Sep 17 00:00:00 2001 From: David Galiffi Date: Thu, 11 Jan 2024 18:35:10 -0500 Subject: [PATCH 33/51] Update link to Wiki page Change "ROCmSoftwarePlatform" to "ROCm" --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index 149ee7900..0aa351e9e 100644 --- a/README.md +++ b/README.md @@ -2,4 +2,4 @@ Tensile is a tool for creating 
benchmark-driven backend libraries for GEMMs, GEM The Tensile library is mainly used as backend library to rocBLAS. Tensile acts as the performance backbone for a wide variety of 'compute' applications running on AMD GPUs. -See [Tensile Wiki](https://github.com/ROCmSoftwarePlatform/Tensile/wiki) for documentation. +See [Tensile Wiki](https://github.com/ROCm/Tensile/wiki) for documentation. From 29532c917114d923ba22b08d8f74bc9ded7e229c Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Tue, 16 Jan 2024 09:01:25 -0700 Subject: [PATCH 34/51] Add new tuning scripts (#1865) Add new tuning scripts to analyze rocblas-bench results and remove tuned sizes from liblogic --- tuning/automation/ListSizes.py | 109 +++++++++++++++++++++++++++++++ tuning/automation/RemoveSizes.py | 91 ++++++++++++++++++++++++++ 2 files changed, 200 insertions(+) create mode 100644 tuning/automation/ListSizes.py create mode 100644 tuning/automation/RemoveSizes.py diff --git a/tuning/automation/ListSizes.py b/tuning/automation/ListSizes.py new file mode 100644 index 000000000..0702fbc36 --- /dev/null +++ b/tuning/automation/ListSizes.py @@ -0,0 +1,109 @@ +################################################################################ +# +# Copyright (C) 2024 Advanced Micro Devices, Inc. All rights reserved. +# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: +# +# The above copyright notice and this permission notice shall be included in +# all copies or substantial portions of the Software. 
+# +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. +# +################################################################################ + +# Generates a CSV file listing sizes that have improved performance between rocblas-bench runs. +# To use, run rocblas-bench and save the output to a file. +# Run rocblas-bench again with the same problem sizes and a new library to be compared. +# Use this script to compare the two sets of results and generate a CSV containing a list of sizes that have improved. +# Usage: +# $ python3 ListSizes.py [-v] + +import argparse +import csv + +from decimal import Decimal + +def parseArgs(): + argParser = argparse.ArgumentParser() + + h = {"baseBench" : "Results of baseline benchmark", + "newBench" : "Results of new benchmark", + "sizeList" : "Output CSV file listing sizes faster in new benchmark", + "verbose" : "Verbose output" + } + + argParser.add_argument("baseBench", type=str, help=h["baseBench"]) + argParser.add_argument("newBench", type=str, help=h["newBench"]) + argParser.add_argument("sizeList", type=str, help=h["sizeList"]) + argParser.add_argument("--verbose", "-v", action="store_true", help=h["verbose"]) + + return argParser.parse_args() + +def main(): + args = parseArgs() + if args.verbose: + print("List winning sizes") + print("Base benchmark : " + args.baseBench) + print("New benchmark : " + args.newBench) + print("Sizes file : " + args.sizeList) + + baseData = [] + with open(args.baseBench) as baseFile: + for line in baseFile: + if line.startswith("transA,"): + labels = line.split(",") + mIdx = 
labels.index("M") + nIdx = labels.index("N") + kIdx = labels.index("K") + bIdx = labels.index("batch_count") + gflopsIdx = labels.index("rocblas-Gflops") + dataLine = next(baseFile) + data = dataLine.split(",") + data = [d.strip() for d in data] + baseData.append([int(data[mIdx]), int(data[nIdx]), int(data[bIdx]), int(data[kIdx]), Decimal(data[gflopsIdx])]) + + newData = [] + with open(args.newBench) as newFile: + for line in newFile: + if line.startswith("transA,"): + labels = line.split(",") + mIdx = labels.index("M") + nIdx = labels.index("N") + kIdx = labels.index("K") + bIdx = labels.index("batch_count") + gflopsIdx = labels.index("rocblas-Gflops") + dataLine = next(newFile) + data = dataLine.split(",") + data = [d.strip() for d in data] + newData.append([int(data[mIdx]), int(data[nIdx]), int(data[bIdx]), int(data[kIdx]), Decimal(data[gflopsIdx])]) + + sizeData = [] + for n in newData: + for b in baseData: + if n[0] == b[0] and n[1] == b[1] and n[2] == b[2] and n[3] == b[3]: + if n[4] >= b[4]: + sizeData.append([n[0], n[1], n[2], n[3]]) + if args.verbose: + print("Adding: {}".format([n[0], n[1], n[2], n[3]])) + break + + with open(args.sizeList, "w") as sizeFile: + csvWriter = csv.writer(sizeFile) + csvWriter.writerows(sizeData) + + if args.verbose: + print("Done writing size list") + +if __name__ == "__main__": + main() diff --git a/tuning/automation/RemoveSizes.py b/tuning/automation/RemoveSizes.py new file mode 100644 index 000000000..dfe46ce6e --- /dev/null +++ b/tuning/automation/RemoveSizes.py @@ -0,0 +1,91 @@ +################################################################################ +# +# Copyright (C) 2024 Advanced Micro Devices, Inc. All rights reserved. 
+# +# Permission is hereby granted, free of charge, to any person obtaining a copy +# of this software and associated documentation files (the "Software"), to deal +# in the Software without restriction, including without limitation the rights +# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell +# copies of the Software, and to permit persons to whom the Software is +# furnished to do so, subject to the following conditions: +# +# The above copyright notice and this permission notice shall be included in +# all copies or substantial portions of the Software. +# +# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, +# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE +# SOFTWARE. +# +################################################################################ + +# Removes tuned sizes from a library logic file. 
+# Usage: +# $ python3 RemoveSizes.py [-v] + +import argparse +import csv +import yaml + +def parseArgs(): + argParser = argparse.ArgumentParser() + + h = {"inLogic" : "Input library logic file", + "outLogic" : "Output library logic file", + "sizeList" : "CSV file containing list of sizes to remove", + "verbose" : "Verbose output" + } + + argParser.add_argument("inLogic", type=str, help=h["inLogic"]) + argParser.add_argument("outLogic", type=str, help=h["outLogic"]) + argParser.add_argument("sizeList", type=str, help=h["sizeList"]) + argParser.add_argument("--verbose", "-v", action="store_true", help=h["verbose"]) + + return argParser.parse_args() + +def main(): + args = parseArgs() + if args.verbose: + print("Removing tuned sizes") + print("Input Logic : " + args.inLogic) + print("Output Logic: " + args.outLogic) + print("Sizes File : " + args.sizeList) + + with open(args.inLogic) as inFile: + logicData = yaml.safe_load(inFile) + + mapping = logicData[7] + if args.verbose: + print("Initial size count = {}".format(len(mapping))) + + with open(args.sizeList) as csvFile: + reader = csv.reader(csvFile) + for row in reader: + found = False + m = int(row[0]) + n = int(row[1]) + b = int(row[2]) + k = int(row[3]) + for tune in mapping: + size = tune[0] + if size[0] == m and size[1] == n and size[2] == b and size[3] == k: + mapping.remove(tune) + found = True + break + if args.verbose: + print("{} {}".format([m, n, b, k], "removed" if found else "not found")) + + if args.verbose: + print("Final size count = {}".format(len(mapping))) + + with open(args.outLogic, "w") as outFile: + yaml.safe_dump(logicData, outFile, default_flow_style=None, sort_keys=False, width=5000) + + if args.verbose: + print("Done writing new logic file") + +if __name__ == "__main__": + main() From d2ee2a1d7523c60c50aea1d38d9bdc6b43ebaaf0 Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Wed, 17 Jan 2024 15:31:20 -0700 Subject: [PATCH 35/51] Stream-K Batch (#1861) Batch support for Stream-K kernels and 
new test cases Update rocBLAS liblogic converter script to work with old logics Reject case for general batch --- Tensile/Components/Signature.py | 4 +- Tensile/KernelWriterAssembly.py | 11 +++++- Tensile/SolutionStructs.py | 4 +- .../Source/lib/source/ContractionProblem.cpp | 3 +- .../Source/lib/source/ContractionSolution.cpp | 14 ++++++- .../extended/stream_k/sk_2tile_hgemm_hhs.yaml | 25 +++++++----- .../extended/stream_k/sk_2tile_sgemm.yaml | 38 ++++++++----------- .../Tests/extended/stream_k/sk_hgemm_hhs.yaml | 25 +++++++----- Tensile/Tests/extended/stream_k/sk_sgemm.yaml | 38 ++++++++----------- .../automation/rocblas-benchInputCreator.py | 4 +- 10 files changed, 93 insertions(+), 73 deletions(-) diff --git a/Tensile/Components/Signature.py b/Tensile/Components/Signature.py index 665f2bef2..fef52d471 100644 --- a/Tensile/Components/Signature.py +++ b/Tensile/Components/Signature.py @@ -275,6 +275,8 @@ def __call__(self, writer): if kernel["StreamK"]: kStr += self.addArgument("MagicNumberProblemNumGroupTiles0", '4', offset, "by_value", "u32"); offset += 4 kStr += self.addArgument("MagicShiftProblemNumGroupTiles0", '4', offset, "by_value", "u32"); offset += 4 + kStr += self.addArgument("MagicNumProblemNumGroupTiles0By1", '4', offset, "by_value", "u32"); offset += 4 + kStr += self.addArgument("MagicShiftProblemNumGroupTiles0By1", '4', offset, "by_value", "u32"); offset += 4 if kernel["PersistentKernel"]: kStr += self.addArgument("MagicNumberProblemNumGroupTiles0", '4', offset, "by_value", "u32"); offset += 4 @@ -290,7 +292,7 @@ def __call__(self, writer): kStr += self.addArgument("MagicNumberItersPerTile", '4', offset,"by_value", "u32"); offset += 4 kStr += self.addArgument("MagicShiftItersPerTile", '4', offset,"by_value", "u32"); offset += 4 kStr += self.addArgument("TotalIters", '4', offset,"by_value", "u32"); offset += 4 - kStr += self.addArgument("SKItersPerWG", '4', offset,"by_value", "u32"); offset += 4 + kStr += self.addArgument("SKItersPerWG", '4', 
offset,"by_value", "u32"); offset += 4 if kernel["StreamK"] == 3: # Two-tile SK kStr += self.addArgument("skGrid", '4', offset,"by_value", "u32"); offset += 4 kStr += self.addArgument("skTiles", '4', offset,"by_value", "u32"); offset += 4 diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index ad39ae82a..585697148 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -1930,9 +1930,11 @@ def initKernel(self, kernel, tPA, tPB ): self.defineSgpr("ItersPerTile", 1) self.defineSgpr("MagicNumberItersPerTile", 1) self.defineSgpr("MagicShiftItersPerTile", 1) + self.defineSgpr("MagicNumProblemNumGroupTiles0By1", 1) # for PKAB, use for Magic Div Alg 2 by (nwg0*nwg1) + self.defineSgpr("MagicShiftProblemNumGroupTiles0By1", 1) # for PKAB, use for Magic Div Alg 2 by (nwg0*nwg1) self.defineSgpr("TotalIters", 1) self.defineSgpr("SKItersPerWG", 1) - skArgumentToLoad += 7 + skArgumentToLoad += 9 if kernel["StreamK"] == 3: # Two-tile SK self.defineSgpr("skGrid", 1) self.defineSgpr("skTiles", 1) @@ -3789,7 +3791,12 @@ def graWorkGroup(self, kernel, isPap): kStr += inst("s_mov_b32", sgpr("StreamKIter"), sgpr(stmp+2), "Increment StreamK Iteration") # Map StreamK tile index to wg0/1 - kStr += self.comment1("Map StreamK tile index to wg0/1") + kStr += self.comment1("Map StreamK tile index to wg0/1/2") + kStr += self.sMagicDivAlg2(kernel, stmp+1, sgpr(stmp), sgpr("MagicNumProblemNumGroupTiles0By1"), sgpr("MagicShiftProblemNumGroupTiles0By1")) + kStr += inst("s_mov_b32", sgpr("WorkGroup2"), sgpr(stmp+1), "wg2 = Tile Idx / problemNumGroupTiles0By1") + kStr += inst("s_mul_i32", sgpr(stmp+1), sgpr(stmp+1), sgpr("NumWorkGroups0"), "remainder part 1 : quotient * divisor") + kStr += inst("s_mul_i32", sgpr(stmp+1), sgpr(stmp+1), sgpr("NumWorkGroups1"), "remainder part 1 : quotient * divisor") + kStr += inst("s_sub_u32", sgpr(stmp), sgpr(stmp), sgpr(stmp+1), "remainder") kStr += self.sMagicDivAlg2(kernel, stmp+1, sgpr(stmp), 
sgpr("MagicNumberProblemNumGroupTiles0"), sgpr("MagicShiftProblemNumGroupTiles0")) kStr += inst("s_mov_b32", sgpr("WorkGroup1"), sgpr(stmp+1), "wg1 = Tile Idx / problemNumGroupTiles0") kStr += inst("s_mul_i32", sgpr("WorkGroup0"), sgpr(stmp+1), sgpr("NumWorkGroups0"), "remainder part 1 : quotient * divisor") diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index 5f94cfa9f..86012f527 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -2938,8 +2938,8 @@ def assignDerivedParameters(state): reject(state, "Cannot enable both Stream-K and GSU") if state["PersistentKernel"]: reject(state, "Cannot enable both Stream-K and PersistentKernel") - if not (2 in state["AssertSizeEqual"].keys() and state["AssertSizeEqual"][2] == 1): - reject(state, "Stream-K with batch requires further testing") + if not state["ProblemType"]["StridedBatched"]: + reject(state, "General batch not supported with Stream-K") if state["StreamK"] == 1: if not state["ProblemType"]["DataType"].isSingle(): reject(state, "Atomic Stream-K currently only tested for SGEMM") diff --git a/Tensile/Source/lib/source/ContractionProblem.cpp b/Tensile/Source/lib/source/ContractionProblem.cpp index 20724e037..8c3f409e8 100644 --- a/Tensile/Source/lib/source/ContractionProblem.cpp +++ b/Tensile/Source/lib/source/ContractionProblem.cpp @@ -781,8 +781,7 @@ namespace Tensile numWG.y *= sizeMapping.globalSplitU; size_t problemTiles = numWG.x * numWG.y; - // if(sizeMapping.persistentKernelAlongBatch || sizeMapping.streamK != 0) - if(sizeMapping.persistentKernelAlongBatch) + if(sizeMapping.persistentKernelAlongBatch || sizeMapping.streamK != 0) problemTiles *= numWG.z; return problemTiles; diff --git a/Tensile/Source/lib/source/ContractionSolution.cpp b/Tensile/Source/lib/source/ContractionSolution.cpp index aef694c6e..81372fee3 100644 --- a/Tensile/Source/lib/source/ContractionSolution.cpp +++ b/Tensile/Source/lib/source/ContractionSolution.cpp @@ -327,8 +327,7 @@ namespace 
Tensile skGrid = getSKGrid(hardware, tiles); rv.numWorkGroups.x = skGrid; rv.numWorkGroups.y = 1; - if(sizeMapping.persistentKernelAlongBatch) - rv.numWorkGroups.z = 1; + rv.numWorkGroups.z = 1; } } @@ -625,6 +624,17 @@ namespace Tensile rv.args.append("itersPerTile", itersPerTile); rv.args.append("magicNumberItersPerTile", magicNumberItersPerTile); rv.args.append("magicShiftItersPerTile", magicShiftItersPerTile); + + uint32_t numGroupTiles0x1 = problemNumGroupTiles0 * problemNumGroupTiles1; + uint32_t magicNumProblemNumGroupTiles0By1; + uint32_t magicShiftProblemNumGroupTiles0By1; + magicNumProblemNumGroupTiles0By1 + = magicNumber(2, numGroupTiles0x1, &magicShiftProblemNumGroupTiles0By1); + rv.args.append("magicNumProblemNumGroupTiles0By1", + magicNumProblemNumGroupTiles0By1); + rv.args.append("magicShiftProblemNumGroupTiles0By1", + magicShiftProblemNumGroupTiles0By1); + rv.args.append("totalIters", totalIters); if(sizeMapping.streamK < 3) // Basic SK { diff --git a/Tensile/Tests/extended/stream_k/sk_2tile_hgemm_hhs.yaml b/Tensile/Tests/extended/stream_k/sk_2tile_hgemm_hhs.yaml index ae148065f..11789390a 100644 --- a/Tensile/Tests/extended/stream_k/sk_2tile_hgemm_hhs.yaml +++ b/Tensile/Tests/extended/stream_k/sk_2tile_hgemm_hhs.yaml @@ -6,7 +6,7 @@ GlobalParameters: BoundsCheck: True KernelTime: True DataInitTypeAlpha: 1 - DataInitTypeBeta: 0 + DataInitTypeBeta: 1 # DataInitTypeA: 1 # DataInitTypeB: 1 # DataInitTypeC: 1 @@ -29,7 +29,7 @@ BenchmarkProblems: HighPrecisionAccumulate: True # True if DataType != ComputeDataType TransposeA: False TransposeB: True - UseBeta: False + UseBeta: True Batched: True - # BenchmarkProblemSizeGroup - Standard @@ -73,16 +73,23 @@ BenchmarkProblems: # - NumElementsPerBatchStore: [8] - AssertAlphaValue: [1] - GlobalReadVectorWidth: [8] - - AssertSizeEqual: [{2: 1}] BenchmarkForkParameters: JoinParameters: BenchmarkJoinParameters: BenchmarkFinalParameters: - ProblemSizes: - - Range: [ [4096], [4096], [1], [1024] ] - - Range: [ 
[4103], [4096], [1], [1024] ] - - Range: [ [4096], [4103], [1], [1024] ] - - Range: [ [4103], [4103], [1], [1024] ] - - Range: [ [4096], [4096], [1], [1031] ] - - Range: [ [4103], [4103], [1], [1031] ] + - Exact: [ 512, 512, 1, 512 ] + - Exact: [ 4096, 4096, 1, 1024 ] + - Exact: [ 4103, 4096, 1, 1024 ] + - Exact: [ 4096, 4103, 1, 1024 ] + - Exact: [ 4103, 4103, 1, 1024 ] + - Exact: [ 4096, 4096, 1, 1031 ] + - Exact: [ 4103, 4103, 1, 1031 ] + - Exact: [ 512, 512, 3, 512 ] + - Exact: [ 4096, 4096, 3, 1024 ] + - Exact: [ 4103, 4096, 3, 1024 ] + - Exact: [ 4096, 4103, 3, 1024 ] + - Exact: [ 4103, 4103, 3, 1024 ] + - Exact: [ 4096, 4096, 3, 1031 ] + - Exact: [ 4103, 4103, 3, 1031 ] diff --git a/Tensile/Tests/extended/stream_k/sk_2tile_sgemm.yaml b/Tensile/Tests/extended/stream_k/sk_2tile_sgemm.yaml index 96cb4f808..fd62b0f92 100644 --- a/Tensile/Tests/extended/stream_k/sk_2tile_sgemm.yaml +++ b/Tensile/Tests/extended/stream_k/sk_2tile_sgemm.yaml @@ -6,7 +6,7 @@ GlobalParameters: BoundsCheck: True KernelTime: True DataInitTypeAlpha: 1 - DataInitTypeBeta: 0 + DataInitTypeBeta: 1 # DataInitTypeA: 1 # DataInitTypeB: 1 # DataInitTypeC: 1 @@ -30,7 +30,7 @@ BenchmarkProblems: DataType: s TransposeA: False TransposeB: True - UseBeta: False + UseBeta: True Batched: True - # BenchmarkProblemSizeGroup - Standard @@ -91,29 +91,23 @@ BenchmarkProblems: # - NumElementsPerBatchStore: [0, 2, 4, 8] # - NumElementsPerBatchStore: [8] # - AssertAlphaValue: [1] - - AssertSizeEqual: [{2: 1}] BenchmarkForkParameters: JoinParameters: BenchmarkJoinParameters: BenchmarkFinalParameters: - ProblemSizes: - # - Exact: [10912, 10976, 1, 13856] - # - Exact: [16000, 13632, 1, 9040] - # - Range: [ [4096, 7, 6144], [4096, 7, 6144], [1], [1024] ] - # - Range: [ [4096, 31, 5120], [4096, 31, 5120], [1], [1024] ] - # - Range: [ [512], [512], [1], [512] ] - - Range: [ [4096], [4096], [1], [1024] ] - - Range: [ [4103], [4096], [1], [1024] ] - - Range: [ [4096], [4103], [1], [1024] ] - - Range: [ [4103], 
[4103], [1], [1024] ] - - Range: [ [4096], [4096], [1], [1031] ] - - Range: [ [4103], [4103], [1], [1031] ] - # - Range: [ [4096], [4096], [1], [1024, 1, 1088] ] - # - Range: [ [4096, 31, 5120], [4096, 31, 5120], [1], [1024, 7, 1280] ] - # - Range: [ [4096, 31, 5120], [4096], [1], [1024] ] - # - Range: [ [4096], [4096, 31, 5120], [1], [1024] ] - # - Range: [ [4096], [4096], [1], [1024, 7, 1280] ] - # - Range: [ [1031], [1031], [1], [1031] ] - # - Range: [ [1031], [1031], [8], [1031] ] - # - Range: [ [4096], [4096], [2], [1024] ] + - Exact: [ 512, 512, 1, 512 ] + - Exact: [ 4096, 4096, 1, 1024 ] + - Exact: [ 4103, 4096, 1, 1024 ] + - Exact: [ 4096, 4103, 1, 1024 ] + - Exact: [ 4103, 4103, 1, 1024 ] + - Exact: [ 4096, 4096, 1, 1031 ] + - Exact: [ 4103, 4103, 1, 1031 ] + - Exact: [ 512, 512, 3, 512 ] + - Exact: [ 4096, 4096, 3, 1024 ] + - Exact: [ 4103, 4096, 3, 1024 ] + - Exact: [ 4096, 4103, 3, 1024 ] + - Exact: [ 4103, 4103, 3, 1024 ] + - Exact: [ 4096, 4096, 3, 1031 ] + - Exact: [ 4103, 4103, 3, 1031 ] diff --git a/Tensile/Tests/extended/stream_k/sk_hgemm_hhs.yaml b/Tensile/Tests/extended/stream_k/sk_hgemm_hhs.yaml index 11398db76..b8e3c864b 100644 --- a/Tensile/Tests/extended/stream_k/sk_hgemm_hhs.yaml +++ b/Tensile/Tests/extended/stream_k/sk_hgemm_hhs.yaml @@ -6,7 +6,7 @@ GlobalParameters: BoundsCheck: True KernelTime: True DataInitTypeAlpha: 1 - DataInitTypeBeta: 0 + DataInitTypeBeta: 1 # DataInitTypeA: 1 # DataInitTypeB: 1 # DataInitTypeC: 1 @@ -29,7 +29,7 @@ BenchmarkProblems: HighPrecisionAccumulate: True # True if DataType != ComputeDataType TransposeA: False TransposeB: True - UseBeta: False + UseBeta: True Batched: True - # BenchmarkProblemSizeGroup - Standard @@ -73,16 +73,23 @@ BenchmarkProblems: # - NumElementsPerBatchStore: [8] - AssertAlphaValue: [1] - GlobalReadVectorWidth: [8] - - AssertSizeEqual: [{2: 1}] BenchmarkForkParameters: JoinParameters: BenchmarkJoinParameters: BenchmarkFinalParameters: - ProblemSizes: - - Range: [ [4096], [4096], [1], 
[1024] ] - - Range: [ [4103], [4096], [1], [1024] ] - - Range: [ [4096], [4103], [1], [1024] ] - - Range: [ [4103], [4103], [1], [1024] ] - - Range: [ [4096], [4096], [1], [1031] ] - - Range: [ [4103], [4103], [1], [1031] ] + - Exact: [ 512, 512, 1, 512 ] + - Exact: [ 4096, 4096, 1, 1024 ] + - Exact: [ 4103, 4096, 1, 1024 ] + - Exact: [ 4096, 4103, 1, 1024 ] + - Exact: [ 4103, 4103, 1, 1024 ] + - Exact: [ 4096, 4096, 1, 1031 ] + - Exact: [ 4103, 4103, 1, 1031 ] + - Exact: [ 512, 512, 3, 512 ] + - Exact: [ 4096, 4096, 3, 1024 ] + - Exact: [ 4103, 4096, 3, 1024 ] + - Exact: [ 4096, 4103, 3, 1024 ] + - Exact: [ 4103, 4103, 3, 1024 ] + - Exact: [ 4096, 4096, 3, 1031 ] + - Exact: [ 4103, 4103, 3, 1031 ] diff --git a/Tensile/Tests/extended/stream_k/sk_sgemm.yaml b/Tensile/Tests/extended/stream_k/sk_sgemm.yaml index b6abd6157..0b1a6049e 100644 --- a/Tensile/Tests/extended/stream_k/sk_sgemm.yaml +++ b/Tensile/Tests/extended/stream_k/sk_sgemm.yaml @@ -6,7 +6,7 @@ GlobalParameters: BoundsCheck: True KernelTime: True DataInitTypeAlpha: 1 - DataInitTypeBeta: 0 + DataInitTypeBeta: 1 # DataInitTypeA: 1 # DataInitTypeB: 1 # DataInitTypeC: 1 @@ -30,7 +30,7 @@ BenchmarkProblems: DataType: s TransposeA: False TransposeB: True - UseBeta: False + UseBeta: True Batched: True - # BenchmarkProblemSizeGroup - Standard @@ -91,29 +91,23 @@ BenchmarkProblems: # - NumElementsPerBatchStore: [0, 2, 4, 8] # - NumElementsPerBatchStore: [8] # - AssertAlphaValue: [1] - - AssertSizeEqual: [{2: 1}] BenchmarkForkParameters: JoinParameters: BenchmarkJoinParameters: BenchmarkFinalParameters: - ProblemSizes: - # - Exact: [10912, 10976, 1, 13856] - # - Exact: [16000, 13632, 1, 9040] - # - Range: [ [4096, 7, 6144], [4096, 7, 6144], [1], [1024] ] - # - Range: [ [4096, 31, 5120], [4096, 31, 5120], [1], [1024] ] - # - Range: [ [512], [512], [1], [512] ] - - Range: [ [4096], [4096], [1], [1024] ] - - Range: [ [4103], [4096], [1], [1024] ] - - Range: [ [4096], [4103], [1], [1024] ] - - Range: [ [4103], [4103], 
[1], [1024] ] - - Range: [ [4096], [4096], [1], [1031] ] - - Range: [ [4103], [4103], [1], [1031] ] - # - Range: [ [4096], [4096], [1], [1024, 1, 1088] ] - # - Range: [ [4096, 31, 5120], [4096, 31, 5120], [1], [1024, 7, 1280] ] - # - Range: [ [4096, 31, 5120], [4096], [1], [1024] ] - # - Range: [ [4096], [4096, 31, 5120], [1], [1024] ] - # - Range: [ [4096], [4096], [1], [1024, 7, 1280] ] - # - Range: [ [1031], [1031], [1], [1031] ] - # - Range: [ [1031], [1031], [8], [1031] ] - # - Range: [ [4096], [4096], [2], [1024] ] + - Exact: [ 512, 512, 1, 512 ] + - Exact: [ 4096, 4096, 1, 1024 ] + - Exact: [ 4103, 4096, 1, 1024 ] + - Exact: [ 4096, 4103, 1, 1024 ] + - Exact: [ 4103, 4103, 1, 1024 ] + - Exact: [ 4096, 4096, 1, 1031 ] + - Exact: [ 4103, 4103, 1, 1031 ] + - Exact: [ 512, 512, 3, 512 ] + - Exact: [ 4096, 4096, 3, 1024 ] + - Exact: [ 4103, 4096, 3, 1024 ] + - Exact: [ 4096, 4103, 3, 1024 ] + - Exact: [ 4103, 4103, 3, 1024 ] + - Exact: [ 4096, 4096, 3, 1031 ] + - Exact: [ 4103, 4103, 3, 1031 ] diff --git a/tuning/automation/rocblas-benchInputCreator.py b/tuning/automation/rocblas-benchInputCreator.py index f1e159df5..5dd437af4 100644 --- a/tuning/automation/rocblas-benchInputCreator.py +++ b/tuning/automation/rocblas-benchInputCreator.py @@ -1,6 +1,6 @@ ################################################################################ # -# Copyright (C) 2016-2023 Advanced Micro Devices, Inc. All rights reserved. +# Copyright (C) 2016-2024 Advanced Micro Devices, Inc. All rights reserved. 
# # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to deal @@ -127,7 +127,7 @@ def getProblemType(problem): else: problemDict["compute_type"] = problemDict["a_type"] - if problem["F32XdlMathOp"]==9: # XF32 + if "F32XdlMathOp" in problem and problem["F32XdlMathOp"]==9: # XF32 problemDict["math_mode"] = 1 return problemDict From f684ba9db3ba3f8c45de90e06d1ea89d943b4855 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Fri, 19 Jan 2024 02:04:27 +0900 Subject: [PATCH 36/51] Force GlobalReadCoalesceGroupA, B to True (#1869) --- Tensile/SolutionStructs.py | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index 86012f527..d602ccec7 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -3234,6 +3234,14 @@ def assignDerivedParameters(state): #print "staggerStrideShift=", staggerStrideShift, "depthu=", state["DepthU"] state["_staggerStrideShift"] = staggerStrideShift + # force GlobalReadCoalesceGroupA, B = True until we fix fail with trsm (TODO: re-enable) + if not state["GlobalReadCoalesceGroupA"]: + print2("GlobalReadCoalesceGroupA=False not supported for now. Force to True") + state["GlobalReadCoalesceGroupA"] = True + if not state["GlobalReadCoalesceGroupB"]: + print2("GlobalReadCoalesceGroupB=False not supported for now. 
Force to True") + state["GlobalReadCoalesceGroupB"] = True + # Use GlobalReadVectorWidth if it is not -1 if state["GlobalReadVectorWidth"] != -1: state["GlobalLoadVectorWidthA"] = state["GlobalReadVectorWidth"] From 4dd0550e275a4979061b3505c859a5e605745306 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Sat, 20 Jan 2024 02:44:25 +0900 Subject: [PATCH 37/51] Optimize temp vgpr allocation for ClusterLocalRead (#1868) - added if condition to allocate temp vgpr only for 8bit datatype --- Tensile/KernelWriterAssembly.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index 585697148..4d3dba472 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -1633,9 +1633,9 @@ def initKernel(self, kernel, tPA, tPB ): self.Fp16AltTmp = self.G2Lpipe1 + 1 vgprIdx += 1 - # packTmp vgpr for wider local read + v_perm + # packTmp vgpr for wider local read + v_perm + 8bit lrvwTileMax = max(self.lrvwTileA, self.lrvwTileB) - if lrvwTileMax > 1: + if lrvwTileMax > 1 and (kernel["ProblemType"]["DataType"].isInt8() or kernel["ProblemType"]["DataType"].is8bitFloat()): self.vgprPackTemp = vgprIdx vgprIdx += 1 @@ -2718,7 +2718,7 @@ def functionSignature(self, kernel ): kStr += self.macroRegister("vgprFp16AltTmp", self.Fp16AltTmp) lrvwTileMax = max(self.lrvwTileA, self.lrvwTileB) - if lrvwTileMax > 1: + if lrvwTileMax > 1 and (kernel["ProblemType"]["DataType"].isInt8() or kernel["ProblemType"]["DataType"].is8bitFloat()): kStr += self.macroRegister("vgprPackTemp", self.vgprPackTemp) # Serial is always the last register in the pool so the store From efbe0c0caeedcf03776ae4e6a0067d88e38da211 Mon Sep 17 00:00:00 2001 From: Gavin Zhao Date: Wed, 24 Jan 2024 15:57:04 -0500 Subject: [PATCH 38/51] Use fallback libraries for archs without optimized logic (#1862) Fixes #1757. 
Enables architectures that don't have optimized logic files to also produce libraries when `--separate-architectures` or `--lazy-library-loading` is turned on. Previously, one must disable both of these two flags in order for rocBLAS to run on architectures like `gfx1010`. --- Tensile/TensileCreateLibrary.py | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/Tensile/TensileCreateLibrary.py b/Tensile/TensileCreateLibrary.py index f28ba3119..58751082d 100644 --- a/Tensile/TensileCreateLibrary.py +++ b/Tensile/TensileCreateLibrary.py @@ -940,11 +940,18 @@ def generateLogicDataAndSolutions(logicFiles, args): # logicData[problemType].append((scheduleName, deviceNames, \ # solutionsForSchedule, indexOrder, exactLogic, rangeLogic )) + (archs, _) = splitArchs() if globalParameters["SeparateArchitectures"] or globalParameters["LazyLibraryLoading"]: if "fallback" in masterLibraries.keys(): for key, value in masterLibraries.items(): if key != "fallback": value.merge(deepcopy(masterLibraries["fallback"])) + for archName in archs: + archName = archName.split('-', 1)[0] + if archName not in masterLibraries: + print1("Using fallback for arch: " + archName) + masterLibraries[archName] = deepcopy(masterLibraries["fallback"]) + masterLibraries[archName].version = args.version masterLibraries.pop("fallback") From 0f367a5fe81860eda65048372be506b4bcaf1616 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Fri, 26 Jan 2024 00:52:23 +0900 Subject: [PATCH 39/51] DirectToVgpr + packing support, increase extended test timeout (#1872) - enabled DirectToVgpr + packing for f8/f16 + TLU cases - enabled negative values for ExtraLatencyForLR to reduce interval of local read and wait for DTV - added test cases for DirectToVgpr + packing - Increase extended test timeout to 720 min --- .jenkins/extended.groovy | 2 +- Tensile/Common.py | 3 +- Tensile/Components/LocalRead.py | 4 + Tensile/KernelWriter.py | 150 +++++++--- Tensile/KernelWriterAssembly.py 
| 123 +++++--- Tensile/SolutionStructs.py | 74 +++-- .../extended/direct_to_vgpr/dtv_f8gemm.yaml | 219 +++++++++++++++ .../extended/direct_to_vgpr/dtv_hgemm.yaml | 262 +++++++++++++++++- 8 files changed, 729 insertions(+), 108 deletions(-) diff --git a/.jenkins/extended.groovy b/.jenkins/extended.groovy index 62b0498a4..d89378d06 100644 --- a/.jenkins/extended.groovy +++ b/.jenkins/extended.groovy @@ -45,7 +45,7 @@ def runCI = boolean formatCheck = false - prj.timeout.test = 600 + prj.timeout.test = 720 prj.defaults.ccache = false def commonGroovy diff --git a/Tensile/Common.py b/Tensile/Common.py index 47c762a00..3a269f461 100644 --- a/Tensile/Common.py +++ b/Tensile/Common.py @@ -1318,7 +1318,8 @@ def getArchitectureName(gfxName): "ExtraMiLatencyLeft": list(range(0,9,2)), # Add extra latency to calculate number of MFMA to insert between local read and wait - "ExtraLatencyForLR": list(range(0,17,2)), + # Negative value means reduce interval between local read and wait (for DirectToVgpr only) + "ExtraLatencyForLR": list(range(0,17,2)) + list(range(-80,0,10)), # Allocate dedicated vgpr for local read with packing # False: use tmp vgpr. Less vgpr usage, but not best for local read scheduling diff --git a/Tensile/Components/LocalRead.py b/Tensile/Components/LocalRead.py index 8edca8896..c51f69eb0 100644 --- a/Tensile/Components/LocalRead.py +++ b/Tensile/Components/LocalRead.py @@ -363,4 +363,8 @@ def __call__(self, writer, bufferIdx, iui, epsi, tP): elif kernel["ProblemType"]["DataType"].isSingle(): localReadCode.addCode(writer.assert_eq( dbgVgpr, 1.0) ) + # DTV case, do not return local read code. Return pack code only. 
+ if kernel["DirectToVgpr%s"%tc]: + return Code.Module(), pack + return imod, pack diff --git a/Tensile/KernelWriter.py b/Tensile/KernelWriter.py index 19d36082b..a2e490218 100644 --- a/Tensile/KernelWriter.py +++ b/Tensile/KernelWriter.py @@ -1496,7 +1496,9 @@ def makeSubIterSchedule(self, kernel, localReadCode, iteration, pointerLWCode, p if count: # insert 1 nop instruction iterCode.addInst("s_nop ",str(count - 1),"VALU packing writes to be consumed by matrix instruction") - if i == numMfmaPerIter - 1: + # the final mfma or DirectToVgpr + PGR2 case, we need to generate all remaining pack instructions + # otherwise, DTV global load can overwrite pack register values + if i == numMfmaPerIter - 1 or len(list(globalReadCodeDTV.items())) > 0: while packItems: iterCode.addCode(packItems.pop(0)) @@ -2013,6 +2015,13 @@ def noLoadLoopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack # if this is the last NoLoadLoop(NLLlast) and self.tailLoopInNLL case, set tail=True for mfmaIter needTailCode = NLLlast and self.tailLoopInNLL + # vregSetIdx for DTV + # NGLL case, use first set. 
NLL case, use second set + vregSetIdxMFMA = 0 if isNGLL else 1 + # flip vregSetIdx if isDTVodd is True + if isDTVodd: + vregSetIdxMFMA = 1 - vregSetIdxMFMA + for uIdx in range(0, kernel["LoopIters"]*kernel["DepthULdsDivisor"]): u = uIdx % kernel["LoopIters"] # u: index in compute loop (in contrast to the notion of global read loop) uDu = uIdx // kernel["LoopIters"] # uDu: index of compute loop @@ -2072,6 +2081,7 @@ def noLoadLoopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack kl.append(self.comment("iter %u%s"%(u,extraComment))) plrIdx = ((u+pflr) % (self.numVgprBuffer+1)) % kernel["LoopIters"] + plrIdxDTV = (u+pflr) % kernel["LoopIters"] localReads = Code.Module() pointerLWCode = Code.Module() @@ -2081,12 +2091,23 @@ def noLoadLoopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack waitLWCode = Code.Module() syncCode = Code.Module() + # vregSetIdx for DTV + vregSetIdxLR = vregSetIdxMFMA + if kernel["LoopIters"] > 1 and u == kernel["LoopIters"] - 1 and \ + not ( isNGLL and (not isDTVodd) and self.generateDTVodd): + # use next vregSet for the last loopIter + # exception for isNGLL and not isDTVodd and odd code enabled case + # in this case, we need to flip twice (for NGLL to NLL, even to odd) + # then, we do not need to flip vregSetIdxLR + vregSetIdxLR = 1 - vregSetIdxLR + if self.enable["LocalRead"]: hasLiveLdsData = kernel["PrefetchGlobalRead"] or (uDu < kernel["DepthULdsDivisor"]-1) hasLiveLdsData = hasLiveLdsData and not isLastLoop # for DirectToVgpr + DTVodd # need to call localReadDo to allocate tmpVgpr for the next DTVeven case (no actual asm code generated for DTV) needExtraLocalReadDo = (NLLlast and isDTVodd and u > localWriteEndIter) + # DTV pack case, generate local read code for DTVodd case hasLiveLdsData = hasLiveLdsData or needExtraLocalReadDo # reads for current loop are done in previous iteration because of wider local read doReadA = (u < kernel["LoopIters"]/self.numIterPerCoalescedReadA - self.numItersPLR) @@ 
-2094,9 +2115,6 @@ def noLoadLoopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack # reads for next loop doReadA = doReadA or (hasLiveLdsData and u > localWriteEndIter) doReadB = doReadB or (hasLiveLdsData and u > localWriteEndIter) - # disable LocalRead if DirectToVgpr is enabled - doReadA = doReadA and (not kernel["DirectToVgprA"]) - doReadB = doReadB and (not kernel["DirectToVgprB"]) for iui in range(0,kernel["InnerUnroll"]): doReadA = doReadA and iui*self.numReadsIterCoalescedA < kernel["InnerUnroll"] doReadB = doReadB and iui*self.numReadsIterCoalescedB < kernel["InnerUnroll"] @@ -2105,19 +2123,33 @@ def noLoadLoopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack # just need to call localReadDo to allocate tmpVgpr if not needExtraLocalReadDo: localReads.addText(self.comment("local read a")) - localReadCodeA, packCodeA = self.localReadDo(kernel, plrIdx*self.numIterPerCoalescedReadA, iui*self.numReadsIterCoalescedA, 0, tensorParametersA) + bufferIdx = plrIdx*self.numIterPerCoalescedReadA + if self.packDTVA: + # DTV + pack case, offset bufferIdx for local read packing instructions + bufferIdx = plrIdxDTV*self.numIterPerCoalescedReadA + vregSetIdxLR * kernel["LoopIters"] + localReadCodeA, packCodeA = self.localReadDo(kernel, bufferIdx, iui*self.numReadsIterCoalescedA, 0, tensorParametersA) if not needExtraLocalReadDo: localReads.addCode(localReadCodeA) pack[plrIdx*self.numIterPerCoalescedReadA].addCode(packCodeA) + if needExtraLocalReadDo and (self.packDTVA or self.packDTVB): + # packDTV + needExtraLocalReadDo, need to update pack code to flip vregSetIdx + pack[plrIdx*self.numIterPerCoalescedReadA].addCode(packCodeA) if doReadB: # needExtraLocalReadDo only case, no need to generate actual code # just need to call localReadDo to allocate tmpVgpr if not needExtraLocalReadDo: localReads.addText(self.comment("local read b")) - localReadCodeB, packCodeB = self.localReadDo(kernel, plrIdx*self.numIterPerCoalescedReadB, 
iui*self.numReadsIterCoalescedB, 0, tensorParametersB) + bufferIdx = plrIdx*self.numIterPerCoalescedReadB + if self.packDTVB: + # DTV + pack case, offset bufferIdx for local read packing instructions + bufferIdx = plrIdxDTV*self.numIterPerCoalescedReadB + vregSetIdxLR * kernel["LoopIters"] + localReadCodeB, packCodeB = self.localReadDo(kernel, bufferIdx, iui*self.numReadsIterCoalescedB, 0, tensorParametersB) if not needExtraLocalReadDo: localReads.addCode(localReadCodeB) pack[plrIdx*self.numIterPerCoalescedReadB].addCode(packCodeB) + if needExtraLocalReadDo and (self.packDTVA or self.packDTVB): + # packDTV + needExtraLocalReadDo, need to update pack code to flip vregSetIdx + pack[plrIdx*self.numIterPerCoalescedReadB].addCode(packCodeB) if (not isResetLroIter or iui != kernel["InnerUnroll"]-1): if doReadA: localReads.addText(self.comment("local read increment a")) @@ -2202,13 +2234,6 @@ def noLoadLoopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack luIdx = (u) % (self.numVgprBuffer+1) # local to use for MACs if self.enable["MAC"]: if kernel["EnableMatrixInstruction"]: - # NGLL case, use first set - setId = 0 if isNGLL else 1 - # flip setId if isDTVodd is True - if isDTVodd: - setId = 1 - setId - # use second set for DirectToVGPR - vregSetIdxMFMA = setId # use first set for NGLL, second set for other cases if ((uIdx+1) == kernel["LoopIters"]*kernel["DepthULdsDivisor"]) and \ (kernel["StoreCInUnroll"]): lastuIdx = (isOptNLL or self.enableSingleNLLOpt) and not isNGLL # do not apply lastuIdx for not isOptNLL case @@ -2337,9 +2362,7 @@ def noLoadLoop( self, kernel, tensorParametersA, tensorParametersB, isOptNLL, is kl.append(self.syncThreads(kernel)) # if DirectToVgpr and ASEM/GSU is not multiple of DepthU*2, generate noLoadLoopBody twice for odd and even exit separately - asem = kernel["AssertSummationElementMultiple"] - gsu = kernel["GlobalSplitU"] - if ( kernel["DirectToVgprA"] or kernel["DirectToVgprB"]) and ((asem%gsu != 0) or (asem//gsu) % 
(kernel["DepthU"] * 2) != 0): + if self.generateDTVodd: # generate additional No Load Loop Body code for odd case (to use the other Vreg set for DirectToVgpr) # 1. generate odd check name = "" @@ -2356,8 +2379,8 @@ def noLoadLoop( self, kernel, tensorParametersA, tensorParametersB, isOptNLL, is # backup self.saveLocalPointers(kernel) # copy pack - if isNGLL: - # NGLL case, no deep copy for pack + if isNGLL or (self.packDTVA or self.packDTVB): + # NGLL or pack DTV case, no deep copy for pack # pack code for local prefetch is generated in noLoadLoopBody and used for DTV even deepCopyPack = pack else: @@ -2533,20 +2556,20 @@ def loopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack, lc, for plrIdx in range(0, self.numItersPLR): pack[plrIdx] = Code.Module() for iui in range(0,kernel["InnerUnroll"]): - if iui*self.numReadsIterCoalescedA < kernel["InnerUnroll"] and (not kernel["DirectToVgprA"]) : # no local read code if DirectToVgpr is enabled + if iui*self.numReadsIterCoalescedA < kernel["InnerUnroll"]: kl.append(self.comment("prefetch local a")) localReadCodeA, packCodeA = self.localReadDo(kernel, plrIdx*self.numIterPerCoalescedReadA, iui*self.numReadsIterCoalescedA, 0, tensorParametersA) kl.append(localReadCodeA) pack[plrIdx].addCode(packCodeA) - if iui*self.numReadsIterCoalescedB < kernel["InnerUnroll"] and (not kernel["DirectToVgprB"]) : # no local read code if DirectToVgpr is enabled + if iui*self.numReadsIterCoalescedB < kernel["InnerUnroll"]: kl.append(self.comment("prefetch local b")) localReadCodeB, packCodeB = self.localReadDo(kernel, plrIdx*self.numIterPerCoalescedReadB, iui*self.numReadsIterCoalescedB, 0, tensorParametersB) kl.append(localReadCodeB) pack[plrIdx].addCode(packCodeB) - if iui*self.numReadsIterCoalescedA < kernel["InnerUnroll"] and (not kernel["DirectToVgprA"]) : # no local read code if DirectToVgpr is enabled + if iui*self.numReadsIterCoalescedA < kernel["InnerUnroll"]: kl.append(self.comment1("local read increment a")) 
kl.append(self.localReadInc(kernel, iui, tensorParametersA)) - if iui*self.numReadsIterCoalescedB < kernel["InnerUnroll"] and (not kernel["DirectToVgprB"]) : # no local read code if DirectToVgpr is enabled + if iui*self.numReadsIterCoalescedB < kernel["InnerUnroll"]: kl.append(self.comment1("local read increment b")) kl.append(self.localReadInc(kernel, iui, tensorParametersB)) @@ -2554,6 +2577,8 @@ def loopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack, lc, kl.append(self.openString(kernel)) pflr = self.numItersPLR # how many pf already done above + # vregSetIdx for DTV + vregSetIdxMFMA = lc ############################################################################ # unrolled loop: mac iterations @@ -2631,6 +2656,7 @@ def loopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack, lc, kl.append(self.comment("iter %u%s"%(u,extraComment))) plrIdx = ((u+pflr) % (self.numVgprBuffer+1)) % kernel["LoopIters"] + plrIdxDTV = (u+pflr) % kernel["LoopIters"] localReads = Code.Module() localReadsA = Code.Module() @@ -2643,6 +2669,22 @@ def loopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack, lc, waitLWCode = Code.Module() syncCode = Code.Module() + # vregSetIdx for DTV + vregSetIdxLR = vregSetIdxMFMA + if kernel["LoopIters"] > 1 and u == kernel["LoopIters"] - 1: + # use next vregSet for the last loopIter (exception: LoopIters==1) + # LoopIters==1 case, local read is for the current iteration and not for the next iteration + vregSetIdxLR = (vregSetIdxLR + 1) % loopCopies + # final loop case, use vregSetIdx for noLoadLoop (NGLL(PGR2) or NLL(PGR1)) + if finalLoop: + # finalLoop case, this is for NoLoadLoop (NGLL(PGR2) or NLL(PGR1)) + # PGR2 case, next is NGLL. Use first set + # PGR1 case, next is NLL. 
Use second set + vregSetIdxLR = 0 if kernel["PrefetchGlobalRead"] == 2 else 1 + # flip vregSetIdx if isDTVodd is True + if self.generateDTVodd: + vregSetIdxLR = 1 - vregSetIdxLR + if self.enable["LocalRead"]: hasLiveLdsData = kernel["PrefetchGlobalRead"] or (uDu < kernel["DepthULdsDivisor"]-1) # reads for current loop are done in previous iteration because of wider local read @@ -2652,20 +2694,26 @@ def loopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack, lc, doReadA = doReadA or (hasLiveLdsData and u > localWriteEndIter) doReadB = doReadB or (hasLiveLdsData and u > localWriteEndIter) # disable LocalRead if DirectToVgpr is enabled - doReadA = doReadA and (not kernel["DirectToVgprA"]) - doReadB = doReadB and (not kernel["DirectToVgprB"]) for iui in range(0,kernel["InnerUnroll"]): doReadA = doReadA and iui*self.numReadsIterCoalescedA < kernel["InnerUnroll"] doReadB = doReadB and iui*self.numReadsIterCoalescedB < kernel["InnerUnroll"] if doReadA: localReads.addText(self.comment("local read a")) - localReadCodeA, packCodeA = self.localReadDo(kernel, plrIdx*self.numIterPerCoalescedReadA, iui*self.numReadsIterCoalescedA, 0, tensorParametersA) + bufferIdx = plrIdx*self.numIterPerCoalescedReadA + if self.packDTVA: + # DTV + pack case, offset bufferIdx for local read packing instructions + bufferIdx = plrIdxDTV*self.numIterPerCoalescedReadA + vregSetIdxLR * kernel["LoopIters"] + localReadCodeA, packCodeA = self.localReadDo(kernel, bufferIdx, iui*self.numReadsIterCoalescedA, 0, tensorParametersA) localReads.addCode(localReadCodeA) localReadsA.addCode(localReadCodeA) pack[plrIdx*self.numIterPerCoalescedReadA].addCode(packCodeA) if doReadB: localReads.addText(self.comment("local read b")) - localReadCodeB, packCodeB = self.localReadDo(kernel, plrIdx*self.numIterPerCoalescedReadB, iui*self.numReadsIterCoalescedB, 0, tensorParametersB) + bufferIdx = plrIdx*self.numIterPerCoalescedReadB + if self.packDTVB: + # DTV + pack case, offset bufferIdx for local read 
packing instructions + bufferIdx = plrIdxDTV*self.numIterPerCoalescedReadB + vregSetIdxLR * kernel["LoopIters"] + localReadCodeB, packCodeB = self.localReadDo(kernel, bufferIdx, iui*self.numReadsIterCoalescedB, 0, tensorParametersB) localReads.addCode(localReadCodeB) localReadsB.addCode(localReadCodeB) pack[plrIdx*self.numIterPerCoalescedReadB].addCode(packCodeB) @@ -2758,7 +2806,6 @@ def loopBody( self, kernel, tensorParametersA, tensorParametersB, kl, pack, lc, luIdx = (u) % (self.numVgprBuffer+1) # local to use for MACs if self.enable["MAC"]: if kernel["EnableMatrixInstruction"]: - vregSetIdxMFMA = lc macIterCode.addCode(self.mfmaIter(kernel, u, kernel["InnerUnroll"], vregSetIdxMFMA, firstIter=firstIter and u == 0)) else: macIterCode.addCode(self.macIter(kernel, luIdx, kernel["InnerUnroll"], True )) @@ -3138,20 +3185,20 @@ def kernelBody( self, kernel, tensorParametersA, tensorParametersB ): # for espi in range(0, (self.prefetchAcrossPersistent and kernel["ExpandPointerSwap"])+1): for espi in range(0, 1): for iui in range(0,kernel["InnerUnroll"]): - if iui*self.numReadsIterCoalescedA < kernel["InnerUnroll"] and (not kernel["DirectToVgprA"]) : # no local read code if DirectToVgpr is enabled + if iui*self.numReadsIterCoalescedA < kernel["InnerUnroll"]: kl.append(self.comment("local read prefetch a")) localReadCodeA, packCodeA = self.localReadDo(kernel, plrIdx*self.numIterPerCoalescedReadA, iui*self.numReadsIterCoalescedA, espi, tensorParametersA) kl.append(localReadCodeA) pack[plrIdx].addCode(packCodeA) - if iui*self.numReadsIterCoalescedB < kernel["InnerUnroll"] and (not kernel["DirectToVgprB"]) : # no local read code if DirectToVgpr is enabled + if iui*self.numReadsIterCoalescedB < kernel["InnerUnroll"]: kl.append(self.comment("local read prefetch b")) localReadCodeB, packCodeB = self.localReadDo(kernel, plrIdx*self.numIterPerCoalescedReadB, iui*self.numReadsIterCoalescedB, espi, tensorParametersB) kl.append(localReadCodeB) pack[plrIdx].addCode(packCodeB) - if 
iui*self.numReadsIterCoalescedA < kernel["InnerUnroll"] and (not kernel["DirectToVgprA"]) : # no local read code if DirectToVgpr is enabled + if iui*self.numReadsIterCoalescedA < kernel["InnerUnroll"]: kl.append(self.comment("local read inc a")) kl.append(self.localReadInc(kernel, iui, tensorParametersA)) - if iui*self.numReadsIterCoalescedB < kernel["InnerUnroll"] and (not kernel["DirectToVgprB"]) : # no local read code if DirectToVgpr is enabled + if iui*self.numReadsIterCoalescedB < kernel["InnerUnroll"]: kl.append(self.comment("local read inc b")) kl.append(self.localReadInc(kernel, iui, tensorParametersB)) kl.append(self.closeSumAtLeastUnroll(kernel, prefetch=True, isOptNLL=False, isPap=False, isNGLL=False)) @@ -3422,31 +3469,33 @@ def kernelBody( self, kernel, tensorParametersA, tensorParametersB ): # print tail loop counter if mEnd>1 (means do tail loop unroll) kl.append(self.comment("tail loop unroll iter %u"%(mValue))) pack[0] = Code.Module() + # always use vregSetIdx=0 for DirectToVgpr + tail loop + vregSetIdxMFMA = 0 for iui in range(0, tailLoopInnerUnroll): if self.enable["LocalRead"]: - doReadA = not kernel["DirectToVgprA"] - doReadB = not kernel["DirectToVgprB"] # local read buffer id. No prefetch in tail loop case. 
bufIdx = (mValue % (self.numVgprBuffer+1)) % kernel["LoopIters"] - if mValue*self.numReadsIterCoalescedA < mEnd and doReadA: + # DTVpack case, use different bufIdx for all loop iterations + bufIdxDTV = mValue % kernel["LoopIters"] + bufIdxA = bufIdxDTV if self.packDTVA else bufIdx + bufIdxB = bufIdxDTV if self.packDTVB else bufIdx + if mValue*self.numReadsIterCoalescedA < mEnd: # Reading 16-bit data from LDS requires packing when ECC enabled kl.append(self.comment("local read a")) - localReadCodeA, packCodeA = self.localReadDo(kernel, bufIdx*self.numIterPerCoalescedReadA, iui*self.numIterPerCoalescedReadA, 0, tensorParametersA) + localReadCodeA, packCodeA = self.localReadDo(kernel, bufIdxA*self.numIterPerCoalescedReadA, iui*self.numIterPerCoalescedReadA, 0, tensorParametersA) kl.append(localReadCodeA) pack[0].addCode(packCodeA) - if mValue*self.numReadsIterCoalescedB < mEnd and doReadB: + if mValue*self.numReadsIterCoalescedB < mEnd: kl.append(self.comment("local read b")) - localReadCodeB, packCodeB = self.localReadDo(kernel, bufIdx*self.numIterPerCoalescedReadB, iui*self.numIterPerCoalescedReadB, 0, tensorParametersB) + localReadCodeB, packCodeB = self.localReadDo(kernel, bufIdxB*self.numIterPerCoalescedReadB, iui*self.numIterPerCoalescedReadB, 0, tensorParametersB) kl.append(localReadCodeB) pack[0].addCode(packCodeB) # adjustment for DirectToLds case iuiParam = iui + tailLoopInnerUnroll * mValue - if doReadA: - kl.append(self.comment("local read inc a")) - kl.append(self.localReadInc(kernel, iuiParam, tensorParametersA)) - if doReadB: - kl.append(self.comment("local read inc b")) - kl.append(self.localReadInc(kernel, iuiParam, tensorParametersB)) + kl.append(self.comment("local read inc a")) + kl.append(self.localReadInc(kernel, iuiParam, tensorParametersA)) + kl.append(self.comment("local read inc b")) + kl.append(self.localReadInc(kernel, iuiParam, tensorParametersB)) if self.enable["Wait"]: kl.append(self.wait(kernel, tensorParametersA, tensorParametersB, -1, 
-1, 0, "4wait for local read")) @@ -3748,6 +3797,12 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): self.tailLoopInNLL = noTailLoop >= 2 self.noEarlyExitForTailLoopInNLL = noTailLoop == 3 + # DTV odd check + # need DTV odd code if (asem//GSU) is not multiple of DepthU*2 + self.generateDTVodd = False + if ( kernel["DirectToVgprA"] or kernel["DirectToVgprB"]) and (asemDivGSU % (kernel["DepthU"] * 2) != 0): + self.generateDTVodd = True + self.actualSummationLoops = 1 if kernel["PackSummationDims"] else kernel["ProblemType"]["NumIndicesSummation"] self.otherSummationLoops = self.actualSummationLoops-1 self.otherSummations = kernel["ProblemType"]["NumIndicesSummation"]-1 # not loops but summations vars @@ -3895,6 +3950,9 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): self.lrvwTileA = min(kernel["MIInputPerThread"], kernel["VectorWidthA"]) # should not exceed MIInputPerThread if (not kernel["UnrollMajorLDSB"]): self.lrvwTileB = min(kernel["MIInputPerThread"], kernel["VectorWidthB"]) # should not exceed MIInputPerThread + # DirectToVgpr + pack (v_perm) + self.packDTVA = kernel["DirectToVgprA"] and self.lrvwTileA > 1 + self.packDTVB = kernel["DirectToVgprB"] and self.lrvwTileB > 1 self.numItersPLR = kernel["PrefetchLocalRead"]%kernel["LoopIters"] self.numVgprBuffer = kernel["LoopIters"] if kernel["PrefetchLocalRead"] > kernel["LoopIters"] else kernel["PrefetchLocalRead"] @@ -4236,7 +4294,11 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): self.swapMfmaInnerLoop = True if (not kernel["ProblemType"]["DataType"].isComplex()) and kernel["DirectToVgprA"] and kernel["PrefetchGlobalRead"] == 2: # not Complex and DTVA + PGR2 case, use B for inner loop to schedule more mfma between DTVA global read instructions - self.swapMfmaInnerLoop = True + # exception: both A and B pack code case + needPackAB = kernel["EnableMatrixInstruction"] and kernel["MIInputPerThread"] > 1 and \ + ((not kernel["UnrollMajorLDSA"]) and 
(not kernel["UnrollMajorLDSB"])) + if not needPackAB: + self.swapMfmaInnerLoop = True # init code optimization # generate local read/write address code and global read tile offset code before wait for kernel arg load (if applicable) diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index 4d3dba472..1e74f5a47 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -1278,7 +1278,11 @@ def initKernel(self, kernel, tPA, tPB ): self.numVgprValuC = (kernel["ThreadTile0"]*kernel["ThreadTile1"]*self.bpeCinternal)//self.bpr PLR = kernel["PrefetchLocalRead"] if kernel["PrefetchLocalRead"] < kernel["LoopIters"] else kernel["LoopIters"] - 1 - valuBlocks = (1+PLR) * kernel["InnerUnroll"] + + PLRplus1A = (1+PLR) if not self.packDTVA else kernel["LoopIters"] + PLRplus1B = (1+PLR) if not self.packDTVB else kernel["LoopIters"] + valuBlocksA = PLRplus1A * kernel["InnerUnroll"] + valuBlocksB = PLRplus1B * kernel["InnerUnroll"] if kernel["EnableMatrixInstruction"]: self.numVgprValuAPerBlock = kernel["MIWaveTileA"] * kernel["MIInputPerThread"] * tPA["bpe"] // self.bpr self.numVgprValuBPerBlock = kernel["MIWaveTileB"] * kernel["MIInputPerThread"] * tPB["bpe"] // self.bpr @@ -1300,13 +1304,13 @@ def initKernel(self, kernel, tPA, tPB ): self.numVgprValuBPerBlock = kernel["ThreadTileB"] # change numVgprValuAPerBlock to 0 for A if DirectToVgpr is enabled - if kernel["DirectToVgprA"]: + if kernel["DirectToVgprA"] and not self.packDTVA: self.numVgprValuAPerBlock = 0 - self.numVgprValuA = self.numVgprValuAPerBlock * valuBlocks + self.numVgprValuA = self.numVgprValuAPerBlock * valuBlocksA # change numVgprValuBPerBlock to 0 for B if DirectToVgpr is enabled - if kernel["DirectToVgprB"]: + if kernel["DirectToVgprB"] and not self.packDTVB: self.numVgprValuBPerBlock = 0 - self.numVgprValuB = self.numVgprValuBPerBlock * valuBlocks + self.numVgprValuB = self.numVgprValuBPerBlock * valuBlocksB if self.archCaps["HasEccHalf"]: self.needPackA = 
tPA["bpe"] < self.bpr and (not kernel["UnrollMajorLDSA"]) and kernel["EnableMatrixInstruction"] @@ -1322,11 +1326,14 @@ def initKernel(self, kernel, tPA, tPB ): needVgprForPack = self.needPackA and kernel["VgprForLocalReadPacking"] if needVgprForPack: if self.lrvwTileA > 1: - self.numVgprValuA //= (1+PLR) + self.numVgprValuA //= PLRplus1A numLoadPerReg = max(1, int(self.numElemPerBprA)//self.lrvwTileA) - valuBlocksPack = (1+PLR) * numLoadPerReg + valuBlocksPack = PLRplus1A * numLoadPerReg else: - valuBlocksPack = (int(self.numElemPerBprA) - 1) + valuBlocksPack = (int(self.numElemPerBprA) - 1) + if self.packDTVA: + # pack DTV case, double the number of blocks + valuBlocksPack *= 2 self.numVgprValuPackA = self.numVgprValuA * valuBlocksPack self.numVgprValuPackB =0 @@ -1334,11 +1341,14 @@ def initKernel(self, kernel, tPA, tPB ): needVgprForPack = self.needPackB and kernel["VgprForLocalReadPacking"] if needVgprForPack: if self.lrvwTileB > 1: - self.numVgprValuB //= (1+PLR) + self.numVgprValuB //= PLRplus1B numLoadPerReg = max(1, int(self.numElemPerBprB)//self.lrvwTileB) - valuBlocksPack = (1+PLR) * numLoadPerReg + valuBlocksPack = PLRplus1B * numLoadPerReg else: valuBlocksPack = (int(self.numElemPerBprB) - 1) + if self.packDTVB: + # pack DTV case, double the number of blocks + valuBlocksPack *= 2 self.numVgprValuPackB = self.numVgprValuB * valuBlocksPack #################################### @@ -1492,9 +1502,13 @@ def initKernel(self, kernel, tPA, tPB ): vgprIdx += self.numVgprValuPackA self.startVgprG2LA = None if not kernel["DirectToLdsA"] or self.do["KeepDirectToLdsAlloc"]: + if self.packDTVA: + # DirectToVgpr + packing + # overlap G2LA and ValuPackA + self.startVgprG2LA = self.startVgprValuPackA # if PGR = True, PAP could be possibly enabled, we move G2LA later to prevent it from being reclaimed # otherwise, put G2L here since it can overlap valu - if not kernel["PrefetchGlobalRead"] and not kernel.enabledSplitLDS: # g2l can overlap valu + elif not 
kernel["PrefetchGlobalRead"] and not kernel.enabledSplitLDS: # g2l can overlap valu self.startVgprG2LA = self.startVgprValuA vgprIdx = self.startVgprValuA \ + max(self.numVgprValuA + self.numVgprValuPackA, self.numVgprG2LA) @@ -1508,9 +1522,13 @@ def initKernel(self, kernel, tPA, tPB ): vgprIdx += self.numVgprValuPackB self.startVgprG2LB = None if not kernel["DirectToLdsB"] or self.do["KeepDirectToLdsAlloc"]: + if self.packDTVB: + # DirectToVgpr + packing + # overlap G2LB and ValuPackB + self.startVgprG2LB = self.startVgprValuPackB # if PGR = True, PAP could be possibly enabled, we move G2LB later to prevent it from being reclaimed # otherwise, put G2L here since it can overlap valu - if not kernel["PrefetchGlobalRead"] and not kernel.enabledSplitLDS: # g2l can overlap valu + elif not kernel["PrefetchGlobalRead"] and not kernel.enabledSplitLDS: # g2l can overlap valu self.startVgprG2LB = self.startVgprValuB vgprIdx = self.startVgprValuB \ + max(self.numVgprValuB + self.numVgprValuPackB, self.numVgprG2LB) @@ -2585,7 +2603,11 @@ def functionSignature(self, kernel ): numBi = PLR+1 ri = 0 if self.numVgprValuA > 0: # Do not generate vgprValuA if numVgprValuA is 0 - for bi in range(0,numBi): # buffer indices + numBiFactor = numBi + if kernel["DirectToVgprA"] and self.lrvwTileA > 1: + # DirectToVgpr case, we need LoopIters * 2 buffers + numBiFactor = kernel["LoopIters"] * 2 + for bi in range(0,numBiFactor): # buffer indices for iui in range(0, kernel["InnerUnroll"]): kStr += self.macroRegister("vgprValuA_X%u_I%u"%(bi,iui), self.startVgprValuA+ri) ri += self.numVgprValuAPerBlock @@ -2594,9 +2616,9 @@ def functionSignature(self, kernel ): if self.numVgprValuPackA > 0: ri = 0 if self.lrvwTileA > 1: - for data in range(0,kernel["MIInputPerThread"]): - for bi in range(0,numBi): # buffer indices - for iui in range(0, kernel["InnerUnroll"]): + for bi in range(0,numBiFactor): # buffer indices + for iui in range(0, kernel["InnerUnroll"]): + for data in 
range(0,kernel["MIInputPerThread"]): kStr += self.macroRegister("vgprValuA_X%u_I%u_D%u"%(bi,iui,data), self.startVgprValuPackA+ri) ri += ceil(self.lrvwTileA * self.tPA["bpe"] / self.bpr) * kernel["MIWaveTileA"] // self.lrvwTileA else: @@ -2614,7 +2636,11 @@ def functionSignature(self, kernel ): ri = 0 if self.numVgprValuB > 0: # Do not generate vgprValuB if numVgprValuB is 0 - for bi in range(0,numBi): # buffer indices + numBiFactor = numBi + if kernel["DirectToVgprB"] and self.lrvwTileB > 1: + # DirectToVgpr case, we need LoopIters * 2 buffers + numBiFactor = kernel["LoopIters"] * 2 + for bi in range(0,numBiFactor): # buffer indices for iui in range(0, kernel["InnerUnroll"]): kStr += self.macroRegister("vgprValuB_X%u_I%u"%(bi,iui), self.startVgprValuB+ri) ri += self.numVgprValuBPerBlock @@ -2623,14 +2649,14 @@ def functionSignature(self, kernel ): if self.numVgprValuPackB > 0: ri = 0 if self.lrvwTileB > 1: - for data in range(0,kernel["MIInputPerThread"]): - for bi in range(0,numBi): # buffer indices - for iui in range(0, kernel["InnerUnroll"]): + for bi in range(0,numBiFactor): # buffer indices + for iui in range(0, kernel["InnerUnroll"]): + for data in range(0,kernel["MIInputPerThread"]): kStr += self.macroRegister("vgprValuB_X%u_I%u_D%u"%(bi,iui,data), self.startVgprValuPackB+ri) ri += ceil(self.lrvwTileB * self.tPB["bpe"] / self.bpr) * kernel["MIWaveTileB"] // self.lrvwTileB else: for data in range(1,int(self.numElemPerBprB)): - for bi in range(0,numBi): # buffer indices + for bi in range(0,numBiFactor): # buffer indices for iui in range(0, kernel["InnerUnroll"]): kStr += self.macroRegister("vgprValuB_X%u_I%u_D%u"%(bi,iui,data), self.startVgprValuPackB+ri) ri += self.numVgprValuBPerBlock @@ -4077,6 +4103,9 @@ def graTileAssignment(self, kernel, tP): dividendReg = self.vgprPool.checkOut(1, "idInWave", self.preventVgprOverflowDuringNewTile) kStr += vectorStaticRemainder(dividendReg, "Serial", divisorVal, tmpSgpr) + # store DirectToVgpr K interval for later use + 
dtvKInterval = 1 + if kernel["DirectToVgpr%s"%tc]: # offset calculation for DirectToVgpr # ported code from local read for DirectToVgpr @@ -4161,7 +4190,11 @@ def graTileAssignment(self, kernel, tP): tluOther = kernel["ProblemType"]["TLUB"] if tP["isA"] else kernel["ProblemType"]["TLUA"] # The other side of tlu if lrvwOther >= 2 and (not tluOther) and tP["tlu"]: # DirectToVgpr + LocalReadVectorWidth>=2 case, multiply qReg by lrvwOther - kStr += staticMultiply(vgpr(qReg), vgpr(qReg), lrvwOther, sgpr(tmpSgpr)) + dtvKInterval = lrvwOther + if tluOther and tP["tlu"]: + # DirectToVgpr + both TLU case, multiply qReg by kernel["MIInputPerThread"] + dtvKInterval = kernel["MIInputPerThread"] + kStr += staticMultiply(vgpr(qReg), vgpr(qReg), dtvKInterval, sgpr(tmpSgpr)) else: divisor2 = divisor @@ -4231,6 +4264,12 @@ def graTileAssignment(self, kernel, tP): tP["gpr"]["tReg"] = tReg2 tP["gpr"]["uReg"] = uReg + # store DirectToVgpr K interval for later use + if tP["isA"]: + self.dtvKIntervalA = dtvKInterval + else: + self.dtvKIntervalB = dtvKInterval + return "" if self.dontAppendCode else kStr ############################################################################## @@ -4420,47 +4459,47 @@ def graUnrollOffsets(self, kernel, tP): stride = kernel[strideIdx] prevStride = 0 totalStride = 0 - lrvwOther = self.lrvwB if tP["isA"] else self.lrvwA # The other side of lrvw - tluOther = kernel["ProblemType"]["TLUB"] if tP["isA"] else kernel["ProblemType"]["TLUA"] # The other side of tlu bpeOffset = 1 if tP["glvw"] >= 1 else tP["bpe"] # glvw<1 case, need to multiply strideValue by bpe + dtvKInterval = self.dtvKIntervalA if tP["isA"] else self.dtvKIntervalB + if tP["ruc"]: # l=0, s=0 kStr += inst("v_mov_b32", vgpr(v), \ - vgpr(tP["gpr"]["uReg"]), "gro%s%s_%u_s%u"%(tP["tensorChar"], self.unrollChar, 0, 0) ) + vgpr(tP["gpr"]["uReg"]), "gro%s%s_%u_s%u"%(tc, self.unrollChar, 0, 0) ) # l=0, s>0 for s in range(1, tP["glvw"]): kStr += inst("_v_add_co_u32", vgpr(v+s), self.vcc, 1, \ - 
vgpr(v+s-1), "gro%s%s_%u_s%u"%(tP["tensorChar"], self.unrollChar, 0, s) ) + vgpr(v+s-1), "gro%s%s_%u_s%u"%(tc, self.unrollChar, 0, s) ) for l in range(1, tP["nru"]): # l>0, s=0 totalStride += stride - if tP["tlu"] and kernel["DirectToVgpr%s"%tc] and lrvwOther >= 2 and not tluOther: - # DirectToVgpr + LocalReadVectorWidth>=2 + other side of TLU is false case, stride * lrvwOther is added every lrvwOther. + if dtvKInterval > 1: + # DirectToVgpr + k interval > 1 case, stride * dtvKInterval is added every dtvKInterval. # Add mod in mod != 0 case - totalStride = stride * (l - (l % lrvwOther)) + (l % lrvwOther) + totalStride = stride * (l - (l % dtvKInterval)) + (l % dtvKInterval) currStride = totalStride - prevStride prevStride = totalStride kStr += inst("_v_add_co_u32", vgpr(v+l*tP["glvw"]), self.vcc, currStride * bpeOffset, \ vgpr(v+(l-1)*tP["glvw"]), \ - "gro%s%s_%u_s%u + %s"%(tP["tensorChar"], self.unrollChar, l, 0, strideIdx) ) + "gro%s%s_%u_s%u + %s"%(tc, self.unrollChar, l, 0, strideIdx) ) # l>0, s>0 for s in range(1, tP["glvw"]): kStr += inst("_v_add_co_u32", vgpr(v+l*tP["glvw"]+s), self.vcc, \ 1, vgpr(v+l*tP["glvw"]+(s-1)), \ - "gro%s%s_%u_s%u"%(tP["tensorChar"], self.unrollChar, 0, s) ) + "gro%s%s_%u_s%u"%(tc, self.unrollChar, 0, s) ) else: kStr += inst("v_mov_b32", vgpr(v), \ - vgpr(tP["gpr"]["uReg"]), "gro%s%s_%u"%(tP["tensorChar"], self.unrollChar, 0) ) + vgpr(tP["gpr"]["uReg"]), "gro%s%s_%u"%(tc, self.unrollChar, 0) ) for l in range(1, tP["nru"]): totalStride += stride - if tP["tlu"] and kernel["DirectToVgpr%s"%tc] and lrvwOther >= 2 and not tluOther: - # DirectToVgpr + LocalReadVectorWidth>=2 case, stride * lrvwOther is added every lrvwOther. + if dtvKInterval > 1: + # DirectToVgpr + k interval > 1 case, stride * dtvKInterval is added every dtvKInterval. 
# Add mod in mod != 0 case - totalStride = stride * (l - (l % lrvwOther)) + (l % lrvwOther) + totalStride = stride * (l - (l % dtvKInterval)) + (l % dtvKInterval) currStride = totalStride - prevStride prevStride = totalStride kStr += inst("_v_add_co_u32", vgpr(v+l), self.vcc, currStride * bpeOffset, \ - vgpr(v+l-1), "gro%s%s_%u + %s"%(tP["tensorChar"], self.unrollChar, l, strideIdx) ) + vgpr(v+l-1), "gro%s%s_%u + %s"%(tc, self.unrollChar, l, strideIdx) ) #self.vgprPool.checkIn(tP["gpr"]["uReg"]) return "" if self.dontAppendCode else kStr @@ -6994,13 +7033,21 @@ def generateSrcStrForMFMA(self, kernel, tP, innerUnroll, vregSetIdx, vgprPerInpu m_or_u = u if kernel["DirectToVgpr%c"%tc] else m vgprBuffer_new = (m_or_u//numIterPerCoalescedRead)*numIterPerCoalescedRead vgprBuffer_new_offset = m_or_u%numIterPerCoalescedRead*innerUnroll*vgprPerInput + # DirectToVgpr + pack special case + # offset vgprBuffer_new + packDTV = self.packDTVA if tc == "A" else self.packDTVB + if packDTV: + # DTV + pack case, offset bufferIdx for local read packing instructions + numBi = kernel["LoopIters"] + vgprBuffer_new += vregSetIdx * numBi iui_new = (iui//numReadsIterCoalesced)*numReadsIterCoalesced iui_new_offset = iui%numReadsIterCoalesced*vgprPerInput ab_new = idxAB*vgprPerInput*numReadsIterCoalesced abStr = "Valu%c_X%u_I%u+%u+%u+%u" % (tc, vgprBuffer_new, iui_new, ab_new, vgprBuffer_new_offset, iui_new_offset) - if kernel["DirectToVgpr%c"%tc]: - # overwrite aStr/bStr for DirectToVgpr + packDTV = self.packDTVA if tP["isA"] else self.packDTVB + if kernel["DirectToVgpr%c"%tc] and not packDTV: + # overwrite aStr/bStr for DirectToVgpr (except for pack DTV case) ab_new += vregSetIdx * numVgprPerBlock + ( vgprBuffer_new * innerUnroll) * numVgprValuPerBlock abStr = "G2L%c+%u+%u" % (tc, ab_new, vgprBuffer_new_offset) diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index d602ccec7..d6897a5ed 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -2221,14 
+2221,16 @@ def setGlobalLoadTileDimFractional(state, tc, depthU, glvwOrig): while grvw >= minGrvw: # Per instruction across the entire group: elementsLoadedPerInst = state["NumThreads"]*grvw + mik = 1 if (state["DirectToVgpr%s"%tc] and state["ProblemType"]["TLU%s"%tc]): - elementsLoadedPerInst //= state["MatrixInstK"] * state["LocalSplitU"] + mik = state["MatrixInstK"] * state["LocalSplitU"] // state["MIInputPerThread"] + elementsLoadedPerInst //= mik # LSC, LSP - #elements loaded along specified dim with each load if parDim >= elementsLoadedPerInst: # entire work-group can work on (part) of the same row # DirectToVgpr case, LSC is limited to elementsLoadedPerInst // (state["MatrixInstK"] * state["LocalSplitU"]) state["LSC%s"%tc] = elementsLoadedPerInst - state["LSP%s"%tc] = 1 if not (state["DirectToVgpr%s"%tc] and state["ProblemType"]["TLU%s"%tc]) else state["MatrixInstK"] * state["LocalSplitU"] + state["LSP%s"%tc] = mik state["NumLoadsCoalesced%s"%tc] = roundupRatio(parDim , state["LSC%s"%tc]) state["NumLoadsPerpendicular%s"%tc] = 1 else: @@ -2249,9 +2251,7 @@ def setGlobalLoadTileDimFractional(state, tc, depthU, glvwOrig): validElementsLoadedPerInst = state["LSC%s"%tc] * state["LSP%s"%tc] grvw //= 2 while grvw >= minGrvw: - elementsLoadedPerInst = state["NumThreads"]*grvw - if state["DirectToVgpr%s"%tc] and state["ProblemType"]["TLU%s"%tc]: - elementsLoadedPerInst //= state["MatrixInstK"] * state["LocalSplitU"] + elementsLoadedPerInst = state["NumThreads"]*grvw//mik if elementsLoadedPerInst < validElementsLoadedPerInst: break # Went too far, not enough load elements at this VW if state["LSC%s"%tc] % grvw == 0: @@ -2426,6 +2426,30 @@ def checkAndAssignWaveSeparateGlobalRead(state, tc): reject(state, "didn't support WaveSeparateGlobalRead when MacroTile is not multiple of wave %u in TLU%s" % (state["MacroTile%s"%tc], tc)) + ######################################## + # determine can we use VgprForLocalReadPacking + @staticmethod + def 
isVgprForLocalReadPackingDoable(state): + rejectComment = "" + doable = True + # MatrixInstruction only + if not state["EnableMatrixInstruction"]: + rejectComment = "VgprForLocalReadPacking is for MatrixInstruction only" + doable = False + # only for HasEccHalf + if not globalParameters["ArchCaps"][globalParameters["CurrentISA"]]["HasEccHalf"]: + rejectComment = "VgprForLocalReadPacking is for EccHalf only" + doable = False + # only for SIA=3 + PLR>=1 + if not (state["ScheduleIterAlg"] == 3 and state["PrefetchLocalRead"] >= 1): + rejectComment = "VgprForLocalReadPacking is effective only fof SIA=3 and PLR>=1" + doable = False + # only for 1 or 2 byte input (numRegister < 1) + UnrollMajorLDSA or B is False + if not (state["ProblemType"]["DataType"].numRegisters() < 1 and (state["UnrollMajorLDSA"] == False or state["UnrollMajorLDSB"] == False)): + rejectComment = "VgprForLocalReadPacking is effective only fof 1 or 2 byte input + UnrollMajorLDSA or B =false" + doable = False + return doable, rejectComment + ######################################## # determine if current datatype can support DirectToVgpr @staticmethod @@ -2470,8 +2494,16 @@ def isDirectToVgprDoable(state, tc): if numBytes < 4: # Does not work with TLU = True and numBytes < 4 (not supported) if state["ProblemType"]["TLU%c"%tc]: - reject(state, "DirectToVgpr%c does not supports TLU%c = True + numByte < 4"%(tc, tc)) - return False + doable, _ = Solution.isVgprForLocalReadPackingDoable(state) + if numBytes * state["VectorWidth%s"%tc] >= 4 and doable: + # use pack logic (with v_perm) same as local read (only if VgprForLocalReadPacking is doable) + # numBytes * VW should be 4 or larger + # force VgprForLocalReadPacking + ClusterLocalRead + state["VgprForLocalReadPacking"] = True + state["ClusterLocalRead"] = True + else: + reject(state, "DirectToVgpr%c does not supports TLU%c = True + numByte < 4"%(tc, tc)) + return False # MIWaveGroup, MatrixInstBM,BN check # for A, MIWaveGroup[1] and MatrixInstBN should be 
1 @@ -2855,6 +2887,10 @@ def ldsPaddingAuto(state, isa): assert(state["LdsPad%s"%tc] >= 0) + # DirectToVgpr case, set LdsPad to 0 + if state["DirectToVgpr%s"%tc]: + state["LdsPad%s"%tc] = 0 + # set LdsBlockSizePerPad = 0 if LdsPad is 0 if state["LdsPad%s"%tc] == 0: state["LdsBlockSizePerPad%s"%tc] = 0 @@ -4594,22 +4630,10 @@ def assignDerivedParameters(state): # reject check for VgprForLocalReadPacking if state["VgprForLocalReadPacking"]: - # MatrixInstruction only - if not state["EnableMatrixInstruction"]: - reject(state, "VgprForLocalReadPacking is for MatrixInstruction only") - return - # only for HasEccHalf - if not globalParameters["ArchCaps"][globalParameters["CurrentISA"]]["HasEccHalf"]: - reject(state, "VgprForLocalReadPacking is for EccHalf only") - return - # only for SIA=3 + PLR>=1 - if not (state["ScheduleIterAlg"] == 3 and state["PrefetchLocalRead"] >= 1): - reject(state, "VgprForLocalReadPacking is effective only fof SIA=3 and PLR>=1") - return - # only for 1 or 2 byte input (numRegister < 1) + UnrollMajorLDSA or B is False - if not (state["ProblemType"]["DataType"].numRegisters() < 1 and (state["UnrollMajorLDSA"] == False or state["UnrollMajorLDSB"] == False)): - reject(state, "VgprForLocalReadPacking is effective only fof 1 or 2 byte input + UnrollMajorLDSA or B =false") - return + doable, rejectComment = Solution.isVgprForLocalReadPackingDoable(state) + if not doable: + reject(state, rejectComment) + return # reject check for ClusterLocalRead if state["ClusterLocalRead"]: @@ -4622,6 +4646,10 @@ def assignDerivedParameters(state): reject(state, "ClusterLocalRead does not support VectorWidth or VectorWidthB > MIInputPerThread") return + # change negative ExtraLatencyForLR to 0 for non DirectToVgpr + if state["ExtraLatencyForLR"] < 0 and not (state["DirectToVgprA"] or state["DirectToVgprB"]): + state["ExtraLatencyForLR"] = 0 + ######################################## # create a dictionary with booleans on whether to include parameter in name 
@staticmethod diff --git a/Tensile/Tests/extended/direct_to_vgpr/dtv_f8gemm.yaml b/Tensile/Tests/extended/direct_to_vgpr/dtv_f8gemm.yaml index 0f0b96e47..ecbbb4472 100644 --- a/Tensile/Tests/extended/direct_to_vgpr/dtv_f8gemm.yaml +++ b/Tensile/Tests/extended/direct_to_vgpr/dtv_f8gemm.yaml @@ -121,7 +121,226 @@ BenchmarkProblems: - ProblemSizes: - Exact: [ 508, 508, 1, 2048] + ######################################## + # F8SS NT - DTVA + DTL + ######################################## + - + - # ProblemType + OperationType: GEMM + DataType: F8 + DestDataType: S + ComputeDataType: S + HighPrecisionAccumulate: True + TransposeA: False + TransposeB: True + UseBeta: True + Batched: True + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - MatrixInstruction: + - [16, 16, 32, 1, 1, 4, 4, 4,1] # 256x64 + - [16, 16, 32, 1, 1, 8, 4, 4,1] # 512x64 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + - [ 64, 1, 1 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI + - AssertFree0ElementMultiple : [4] + - AssertFree1ElementMultiple : [4] + - AssertSummationElementMultiple: [128] + - DepthU: [64,128] + - 1LDSBuffer: [0] + - LoopTail: [True] + - OptNoLoadLoop: [1] + - PrefetchGlobalRead: [1,2] + - PrefetchLocalRead: [1,2,3,5,9,17] + - ScheduleIterAlg: [3] + - StaggerU: [0] + - SourceSwap: [1] + #- TransposeLDS: [1] + - GlobalReadVectorWidth: [4,8] + - LocalReadVectorWidth: [4,8] + - VectorWidth: [4] + #- WaveSeparateGlobalReadB: [1] + - NumElementsPerBatchStore: [4] + - UseSgprForGRO: [0] + - DirectToVgprA: [1] + #- DirectToLdsA: [False, True] + - DirectToLdsB: [False, True] + #- NumLoadsCoalescedA: [1,2,4] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Exact: [ 508, 508, 1, 2048] + ######################################## + # F8SS 
NT - DTVB + DTL + ######################################## + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - MatrixInstruction: + - [16, 16, 32, 1, 1, 4, 4, 1, 4] # 64x256 + - [16, 16, 32, 1, 1, 4, 8, 1, 4] # 64x512 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + - [ 64, 1, 1 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI + - AssertFree0ElementMultiple : [4] + - AssertFree1ElementMultiple : [4] + - AssertSummationElementMultiple: [128] + - DepthU: [64,128] + - 1LDSBuffer: [0] + - LoopTail: [True] + - OptNoLoadLoop: [1] + - PrefetchGlobalRead: [1,2] + - PrefetchLocalRead: [1,2,3,5,9,17] + - ScheduleIterAlg: [3] + - StaggerU: [0] + - SourceSwap: [1] + #- TransposeLDS: [1] + - GlobalReadVectorWidth: [4,8] + - LocalReadVectorWidth: [4,8] + - VectorWidth: [4] + #- WaveSeparateGlobalReadB: [1] + - NumElementsPerBatchStore: [4] + - UseSgprForGRO: [0] + - DirectToVgprB: [1] + - DirectToLdsA: [False, True] + #- DirectToLdsB: [False, True] + #- NumLoadsCoalescedA: [1,2,4] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Exact: [ 508, 508, 1, 2048] + ######################################## + # F8SS NN - DTVA + DTL + ######################################## + - + - # ProblemType + OperationType: GEMM + DataType: F8 + DestDataType: S + ComputeDataType: S + HighPrecisionAccumulate: True + TransposeA: False + TransposeB: False + UseBeta: True + Batched: True + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - MatrixInstruction: + - [16, 16, 32, 1, 1, 4, 4, 4,1] # 256x64 + - [16, 16, 32, 1, 1, 8, 4, 4,1] # 512x64 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + - [ 64, 1, 1 ] # only WG2 is effective for 9 
parameter MI + #- [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI + - AssertFree0ElementMultiple : [4] + - AssertFree1ElementMultiple : [4] + - AssertSummationElementMultiple: [128] + - DepthU: [64,128] + - 1LDSBuffer: [0] + - LoopTail: [True] + - OptNoLoadLoop: [1] + - PrefetchGlobalRead: [1,2] + - PrefetchLocalRead: [1,2,3,5,9,17] + - ScheduleIterAlg: [3] + - StaggerU: [0] + - SourceSwap: [1] + - TransposeLDS: [1] + - GlobalReadVectorWidth: [4,8] + - LocalReadVectorWidth: [4,8] + - VectorWidth: [4] + #- WaveSeparateGlobalReadB: [1] + - NumElementsPerBatchStore: [4] + - UseSgprForGRO: [0] + - DirectToVgprA: [1] + #- DirectToLdsA: [False, True] + - DirectToLdsB: [False, True] + #- NumLoadsCoalescedA: [1,2,4] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Exact: [ 508, 508, 1, 2048] + + + ######################################## + # F8SS TT - DTVB + DTL + ######################################## + - + - # ProblemType + OperationType: GEMM + DataType: F8 + DestDataType: S + ComputeDataType: S + HighPrecisionAccumulate: True + TransposeA: True + TransposeB: True + UseBeta: True + Batched: True + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - MatrixInstruction: + - [16, 16, 32, 1, 1, 4, 4, 1, 4] # 64x256 + - [16, 16, 32, 1, 1, 4, 8, 1, 4] # 64x512 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + - [ 64, 1, 1 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI + - AssertFree0ElementMultiple : [4] + - AssertFree1ElementMultiple : [4] + - AssertSummationElementMultiple: [128] + - DepthU: [64,128] + - 1LDSBuffer: [0] + - LoopTail: [True] + - OptNoLoadLoop: [1] + - PrefetchGlobalRead: [1,2] + - PrefetchLocalRead: [1,2,3,5,9,17] + - ScheduleIterAlg: 
[3] + - StaggerU: [0] + - SourceSwap: [1] + - TransposeLDS: [1] + - GlobalReadVectorWidth: [4,8] + - LocalReadVectorWidth: [4,8] + - VectorWidth: [4] + #- WaveSeparateGlobalReadB: [1] + - NumElementsPerBatchStore: [4] + - UseSgprForGRO: [0] + - DirectToVgprB: [1] + - DirectToLdsA: [False, True] + #- DirectToLdsB: [False, True] + #- NumLoadsCoalescedA: [1,2,4] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Exact: [ 508, 508, 1, 2048] diff --git a/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml b/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml index b237842a3..7fe9b0028 100644 --- a/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml +++ b/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml @@ -354,7 +354,7 @@ BenchmarkProblems: - Range: [ [511], [511], [1], [2023, 24, 2047] ] ######################################## - # HHS NN - DTVB (+ DTL) + max load width for TailLoopp + VFLRP + # HHS NN - DTVB (+ DTL) + max load width for TailLoop + VFLRP ######################################## - - # ProblemType @@ -474,3 +474,263 @@ BenchmarkProblems: BenchmarkFinalParameters: - ProblemSizes: - Range: [ [511], [511], [1], [2023, 24, 2047] ] + + ######################################## + # HHS NN - DTVA (+ DTL) + max load width for TailLoop + VFLRP + ######################################## + - + - # ProblemType + OperationType: GEMM + DataType: H + DestDataType: H + ComputeDataType: S + HighPrecisionAccumulate: True + TransposeA: False + TransposeB: False + UseBeta: True + Batched: True + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - KernelLanguage: ["Assembly"] + - MinKForGSU: [64] + ForkParameters: + - MatrixInstruction: + - [16, 16, 16, 1, 1, 2, 4, 4,1] # 128x 64 + - [16, 16, 16, 1, 1, 4, 4, 2,1] # 128x 64 + - [16, 16, 16, 1, 1, 4, 4, 4,1] # 256x 64 + - [32, 32, 8, 1, 1, 2, 4, 4,1] # 256x128 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + - [ 64, 1, 1 ] # only WG2 is effective for 9 
parameter MI + - [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI + - AssertFree0ElementMultiple : [8] + - AssertFree1ElementMultiple : [8] + - AssertSizeGreaterThan: [{}, {3: 192}] + - AssertSummationElementMultiple: [8, 64] + - DepthU: [32,64] + - 1LDSBuffer: [0] + - PrefetchGlobalRead: [1,2] + - PrefetchLocalRead: [1,3,5,9] + - ScheduleIterAlg: [3] + #- StaggerU: [0,32] + - SourceSwap: [1]#[0,1] + - TransposeLDS: [1] + - GlobalReadVectorWidth: [2,4] + - LocalReadVectorWidth: [4]#[4,8] + - VectorWidth: [2,4] + - UseSgprForGRO: [0] + - DirectToVgprA: [0,1] + #- DirectToLdsA: [False, True] + - DirectToLdsB: [False, True] + - NumLoadsCoalescedB: [1] + #- BufferLoad: [0,1] + - GlobalSplitU: [1,2] + - GlobalSplitUAlgorithm: ["MultipleBuffer"] + - VgprForLocalReadPacking: [1] + - ClusterLocalRead: [1] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Range: [ [504], [504], [1], [2024, 8, 2040] ] + - Range: [ [504], [504], [1], [200] ] + - Range: [ [504], [504], [1], [192] ] + + ######################################## + # HHS NT - DTVA (+ DTL) + max load width for TailLoop + VFLRP + ######################################## + - + - # ProblemType + OperationType: GEMM + DataType: H + DestDataType: H + ComputeDataType: S + HighPrecisionAccumulate: True + TransposeA: False + TransposeB: True + UseBeta: True + Batched: True + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - KernelLanguage: ["Assembly"] + - MinKForGSU: [64] + ForkParameters: + - MatrixInstruction: + - [16, 16, 16, 1, 1, 2, 4, 4,1] # 128x 64 + - [16, 16, 16, 1, 1, 4, 4, 2,1] # 128x 64 + - [16, 16, 16, 1, 1, 4, 4, 4,1] # 256x 64 + - [32, 32, 8, 1, 1, 2, 4, 4,1] # 256x128 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + - [ 64, 1, 1 ] # only WG2 is effective for 9 parameter MI + - [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 4 ] # only WG2 is effective 
for 9 parameter MI + - AssertFree0ElementMultiple : [8] + - AssertFree1ElementMultiple : [8] + - AssertSizeGreaterThan: [{}, {3: 192}] + - AssertSummationElementMultiple: [8, 64] + - DepthU: [32,64] + - 1LDSBuffer: [0] + - PrefetchGlobalRead: [1,2] + - PrefetchLocalRead: [1,3,5,9] + - ScheduleIterAlg: [3] + #- StaggerU: [0,32] + - SourceSwap: [1]#[0,1] + #- TransposeLDS: [1] + - GlobalReadVectorWidth: [2,4] + - LocalReadVectorWidth: [4]#[4,8] + - VectorWidth: [2,4] + - VectorWidthB: [2,4] + - UseSgprForGRO: [0] + - DirectToVgprA: [0,1] + #- DirectToLdsA: [False, True] + - DirectToLdsB: [False, True] + - NumLoadsCoalescedB: [1] + #- BufferLoad: [0,1] + - GlobalSplitU: [1,2] + - GlobalSplitUAlgorithm: ["MultipleBuffer"] + - VgprForLocalReadPacking: [1] + - ClusterLocalRead: [1] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Range: [ [504], [504], [1], [2024, 8, 2040] ] + - Range: [ [504], [504], [1], [200] ] + - Range: [ [504], [504], [1], [192] ] + + ######################################## + # HHS NT - DTVB (+ DTL) + max load width for TailLoop + VFLRP + ######################################## + - + - # ProblemType + OperationType: GEMM + DataType: H + DestDataType: H + ComputeDataType: S + HighPrecisionAccumulate: True + TransposeA: False + TransposeB: True + UseBeta: True + Batched: True + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - KernelLanguage: ["Assembly"] + - MinKForGSU: [64] + ForkParameters: + - MatrixInstruction: + #- [16, 16, 16, 1, 1, 4, 2, 1, 4] # 64x128 + - [16, 16, 16, 1, 1, 4, 4, 1, 2] # 64x128 + - [16, 16, 16, 1, 1, 4, 4, 1, 4] # 64x256 + - [32, 32, 8, 1, 1, 4, 2, 1, 4] # 128x256 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + - [ 64, 1, 1 ] # only WG2 is effective for 9 parameter MI + - [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI + - AssertFree0ElementMultiple : [8] + - AssertFree1ElementMultiple 
: [8] + - AssertSizeGreaterThan: [{}, {3: 192}] + - AssertSummationElementMultiple: [8, 64] + - DepthU: [32,64] + - 1LDSBuffer: [0] + - PrefetchGlobalRead: [1,2] + - PrefetchLocalRead: [1,3,5,9] + - ScheduleIterAlg: [3] + #- StaggerU: [0,32] + - SourceSwap: [1]#[0,1] + #- TransposeLDS: [1] + - GlobalReadVectorWidth: [2,4] + - LocalReadVectorWidth: [4]#[4,8] + - VectorWidth: [2,4] + - VectorWidthB: [2,4] + - UseSgprForGRO: [0] + - DirectToVgprB: [0,1] + - DirectToLdsA: [False, True] + #- DirectToLdsB: [False, True] + - NumLoadsCoalescedB: [1] + #- BufferLoad: [0,1] + #- GlobalSplitU: [1,2] + #- GlobalSplitUAlgorithm: ["MultipleBuffer"] + - VgprForLocalReadPacking: [1] + - ClusterLocalRead: [1] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Range: [ [504], [504], [1], [2024, 8, 2040] ] + - Range: [ [504], [504], [1], [200] ] + - Range: [ [504], [504], [1], [192] ] + + ######################################## + # HHS TT - DTVB (+ DTL) + max load width for TailLoop + VFLRP + ######################################## + - + - # ProblemType + OperationType: GEMM + DataType: H + DestDataType: H + ComputeDataType: S + HighPrecisionAccumulate: True + TransposeA: True + TransposeB: True + UseBeta: True + Batched: True + - + InitialSolutionParameters: + BenchmarkCommonParameters: + - EdgeType: ["ShiftPtr"] + - KernelLanguage: ["Assembly"] + - MinKForGSU: [64] + ForkParameters: + - MatrixInstruction: + #- [16, 16, 16, 1, 1, 4, 2, 1, 4] # 64x128 + - [16, 16, 16, 1, 1, 4, 4, 1, 2] # 64x128 + - [16, 16, 16, 1, 1, 4, 4, 1, 4] # 64x256 + - [32, 32, 8, 1, 1, 4, 2, 1, 4] # 128x256 + #- ThreadTile: + # - [ 2, 2 ] + - WorkGroup: + - [ 64, 1, 1 ] # only WG2 is effective for 9 parameter MI + - [ 64, 1, 2 ] # only WG2 is effective for 9 parameter MI + #- [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI + - AssertFree0ElementMultiple : [8] + - AssertFree1ElementMultiple : [8] + - AssertSizeGreaterThan: [{}, {3: 192}] + - AssertSummationElementMultiple: 
[8, 64] + - DepthU: [32,64] + - 1LDSBuffer: [0] + - PrefetchGlobalRead: [1,2] + - PrefetchLocalRead: [1,3,5,9] + - ScheduleIterAlg: [3] + #- StaggerU: [0,32] + - SourceSwap: [1]#[0,1] + - TransposeLDS: [1] + - GlobalReadVectorWidth: [2,4] + - LocalReadVectorWidth: [4]#[4,8] + - VectorWidth: [2,4] + - VectorWidthB: [2,4] + - UseSgprForGRO: [0] + - DirectToVgprB: [0,1] + - DirectToLdsA: [False, True] + #- DirectToLdsB: [False, True] + - NumLoadsCoalescedB: [1] + #- BufferLoad: [0,1] + #- GlobalSplitU: [1,2] + #- GlobalSplitUAlgorithm: ["MultipleBuffer"] + - VgprForLocalReadPacking: [1] + - ClusterLocalRead: [1] + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Range: [ [504], [504], [1], [2024, 8, 2040] ] + - Range: [ [504], [504], [1], [200] ] + - Range: [ [504], [504], [1], [192] ] + From ac1ca7bb8fdbaeab21f325996e10a3723b563c29 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Fri, 26 Jan 2024 01:00:09 +0900 Subject: [PATCH 40/51] Small fix for LdsPad auto (#1871) - fixed incorrect value assignment for autoAdjusted - set LdsBlockSizePerPadA or B = 0 if stride is not power of 2 --- Tensile/SolutionStructs.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index d6897a5ed..c84b1b4b3 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -2810,7 +2810,7 @@ def ldsPaddingAuto(state, isa): state["LdsPad%s"%tc] = 0 else: state["LdsPad%s"%tc] = vw - autoAdjusted["LdsPad%s"%tc] = autoCalcLBSPP + autoAdjusted["LdsPad%s"%tc] = autoCalcLP if state["EnableMatrixInstruction"]: # MI case @@ -2831,6 +2831,7 @@ def ldsPaddingAuto(state, isa): # if LRstrideLine is not power of 2, adjust ldsPad at each line (keep LRstride = 0) if LRstrideLine <= 0 or (LRstrideLine & (LRstrideLine - 1)) != 0: LRstride = 0 + state["LdsBlockSizePerPad%s"%tc] = 0 # force LdsBlockSizePerPad to 0 # auto calc for LBSPP if autoCalcLBSPP and 
LRstride > 0: state["LdsBlockSizePerPad%s"%tc] = max(int(2**(math.ceil(math.log(LRstride * numBytes, 2)))), 128) From a8d42d1875f2d10ea4f025a00b56dbfeb32b2677 Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Thu, 25 Jan 2024 14:12:58 -0700 Subject: [PATCH 41/51] Predicate for arithmetic intensity (#1850) --- HostLibraryTests/CMakeLists.txt | 1 + HostLibraryTests/Predicates_test.cpp | 68 ++++++++++++++++ Tensile/Common.py | 8 ++ Tensile/Contractions.py | 8 +- .../include/Tensile/ContractionProblem.hpp | 8 ++ .../Tensile/ContractionProblemPredicates.hpp | 77 +++++++++++++++++++ .../Serialization/ContractionPredicates.hpp | 14 ++++ .../Source/lib/source/ContractionProblem.cpp | 37 +++++++++ 8 files changed, 220 insertions(+), 1 deletion(-) create mode 100644 HostLibraryTests/Predicates_test.cpp diff --git a/HostLibraryTests/CMakeLists.txt b/HostLibraryTests/CMakeLists.txt index 6a67cf7c1..73a77f3cc 100644 --- a/HostLibraryTests/CMakeLists.txt +++ b/HostLibraryTests/CMakeLists.txt @@ -131,6 +131,7 @@ set(test_sources ${test_sources} DataTypes_test.cpp EmbeddedData_test.cpp KernelArguments_test.cpp + Predicates_test.cpp ProjectedPerformance_test.cpp DecisionTree_test.cpp TensorDescriptor_test.cpp diff --git a/HostLibraryTests/Predicates_test.cpp b/HostLibraryTests/Predicates_test.cpp new file mode 100644 index 000000000..d2f2cd839 --- /dev/null +++ b/HostLibraryTests/Predicates_test.cpp @@ -0,0 +1,68 @@ +/******************************************************************************* + * + * MIT License + * + * Copyright (C) 2023 Advanced Micro Devices, Inc. All rights reserved. 
+ * + * Permission is hereby granted, free of charge, to any person obtaining a copy + * of this software and associated documentation files (the "Software"), to deal + * in the Software without restriction, including without limitation the rights + * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the Software is + * furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice shall be included in + * all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE + * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE + * SOFTWARE. 
+ * + *******************************************************************************/ + +#include + +#include + +TEST(Predicates, ArithmeticIntensity) +{ + using namespace Tensile; + + ContractionProblem a = ContractionProblem::GEMM( + false, true, 1000, 1500, 500, 2000, 2000, 2000, 3.0, false, 1); // 88.4 + ContractionProblem b = ContractionProblem::GEMM( + false, true, 500, 1000, 1000, 2000, 2000, 2000, 0.0, false, 5); // 125 + ContractionProblem c = ContractionProblem::GEMM( + false, true, 2000, 100, 2000, 2000, 2000, 2000, 1.0, false, 10); // 43.5 + ContractionProblem d = ContractionProblem::GEMM( + false, true, 2000, 2000, 450, 2000, 2000, 2000, 2.0, false, 1); // 92.04 + + auto pg1 = std::make_shared(100); + auto pg2 = std::make_shared(75); + auto pl1 = std::make_shared(100); + auto pl2 = std::make_shared(75); + + EXPECT_EQ(false, (*pg1)(a)); + EXPECT_EQ(true, (*pg2)(a)); + EXPECT_EQ(true, (*pl1)(a)); + EXPECT_EQ(false, (*pl2)(a)); + + EXPECT_EQ(true, (*pg1)(b)); + EXPECT_EQ(true, (*pg2)(b)); + EXPECT_EQ(false, (*pl1)(b)); + EXPECT_EQ(false, (*pl2)(b)); + + EXPECT_EQ(false, (*pg1)(c)); + EXPECT_EQ(false, (*pg2)(c)); + EXPECT_EQ(true, (*pl1)(c)); + EXPECT_EQ(true, (*pl2)(c)); + + EXPECT_EQ(false, (*pg1)(d)); + EXPECT_EQ(true, (*pg2)(d)); + EXPECT_EQ(true, (*pl1)(d)); + EXPECT_EQ(false, (*pl2)(d)); +} diff --git a/Tensile/Common.py b/Tensile/Common.py index 3a269f461..50fb00465 100644 --- a/Tensile/Common.py +++ b/Tensile/Common.py @@ -843,6 +843,12 @@ def getArchitectureName(gfxName): "AssertSizeLessThan": -1, "AssertSizeMultiple": -1, + # Assertions that require arithmetic intensity to be specified value. + # Arithmetic intensity measures the ratio of computation to memory bandwidth required for a problem. + # These predicates can be used to adjust solution selection compute-bound or memory-bound problems. 
+ "AssertAIGreaterThanEqual": -1, + "AssertAILessThanEqual": -1, + #Assert values for alpha and beta "AssertBetaValue": [False, 1, -1], "AssertAlphaValue": [False, 1, -1], @@ -1493,6 +1499,8 @@ def getArchitectureName(gfxName): {"AssertSizeGreaterThan": [ {} ] }, {"AssertSizeMultiple": [ {} ] }, {"AssertSizeLessThan": [ {} ] }, + {"AssertAIGreaterThanEqual": [ -1 ] }, + {"AssertAILessThanEqual": [ -1 ] }, {"AssertAlphaValue": [ False ]}, {"AssertBetaValue": [ False ]}, {"AssertCEqualsD": [ False ]}, diff --git a/Tensile/Contractions.py b/Tensile/Contractions.py index 7176fccd1..79e8f160d 100644 --- a/Tensile/Contractions.py +++ b/Tensile/Contractions.py @@ -317,7 +317,13 @@ def FromOriginalKeyPair(cls, pair): if key == "AssertSizeMultiple": return extractDimPredicate(cls, key, value, "SizeMultiple") - #Alpha and beta value assertions + # Arithmetic intensity assertions + if key == "AssertAIGreaterThanEqual": + return cls("AIGreaterThanEqual", value=value) if value > 0 else None + if key == "AssertAILessThanEqual": + return cls("AILessThanEqual", value=value) if value > 0 else None + + # Alpha and beta value assertions if key == "AssertAlphaValue": return cls("AlphaValue", value=str(value)) if value != False else None if key == "AssertBetaValue": diff --git a/Tensile/Source/lib/include/Tensile/ContractionProblem.hpp b/Tensile/Source/lib/include/Tensile/ContractionProblem.hpp index 01b2a049f..c0db8cd3d 100644 --- a/Tensile/Source/lib/include/Tensile/ContractionProblem.hpp +++ b/Tensile/Source/lib/include/Tensile/ContractionProblem.hpp @@ -508,6 +508,11 @@ namespace Tensile return m_cEqualsD; } + double arithmeticIntensity() const + { + return m_arithmeticIntensity; + } + void setAlphaType(DataType type) { m_alphaType = type; @@ -861,6 +866,8 @@ namespace Tensile KernelLanguage m_kernelLanguage = KernelLanguage::Any; PerformanceMetric m_performanceMetric = PerformanceMetric::DeviceEfficiency; + double m_arithmeticIntensity; + DataType m_alphaType = DataType::None; // 
if not assigned, will follow d-type DataType m_betaType = DataType::None; // for bwd-compatible @@ -897,6 +904,7 @@ namespace Tensile void normalize(); void consistencyCheck() const; + void calcArithmeticIntensity(); void getIndexNames(std::string& aNames, std::string& bNames, diff --git a/Tensile/Source/lib/include/Tensile/ContractionProblemPredicates.hpp b/Tensile/Source/lib/include/Tensile/ContractionProblemPredicates.hpp index 140341a8f..4a64215bf 100644 --- a/Tensile/Source/lib/include/Tensile/ContractionProblemPredicates.hpp +++ b/Tensile/Source/lib/include/Tensile/ContractionProblemPredicates.hpp @@ -920,6 +920,83 @@ namespace Tensile } }; + struct AIGreaterThanEqual + : public Predicate_CRTP + { + enum + { + HasIndex = false, + HasValue = true + }; + + double value; + + AIGreaterThanEqual() = default; + AIGreaterThanEqual(double value) + : value(value) + { + } + + static std::string Type() + { + return "AIGreaterThanEqual"; + } + + virtual bool operator()(ContractionProblem const& problem) const override + { + return problem.arithmeticIntensity() >= value; + } + + virtual bool debugEval(ContractionProblem const& problem, + std::ostream& stream) const override + { + bool rv = (*this)(problem); + + stream << *this << ": (" << problem.arithmeticIntensity() << " >= " << value + << ") == " << rv; + + return rv; + } + }; + + struct AILessThanEqual : public Predicate_CRTP + { + enum + { + HasIndex = false, + HasValue = true + }; + + double value; + + AILessThanEqual() = default; + AILessThanEqual(double value) + : value(value) + { + } + + static std::string Type() + { + return "AILessThanEqual"; + } + + virtual bool operator()(ContractionProblem const& problem) const override + { + return problem.arithmeticIntensity() <= value; + } + + virtual bool debugEval(ContractionProblem const& problem, + std::ostream& stream) const override + { + bool rv = (*this)(problem); + + stream << *this << ": (" << problem.arithmeticIntensity() << " <= " << value + << ") == " << rv; 
+ + return rv; + } + }; + struct AlphaValue : public Predicate_CRTP { enum diff --git a/Tensile/Source/lib/include/Tensile/Serialization/ContractionPredicates.hpp b/Tensile/Source/lib/include/Tensile/Serialization/ContractionPredicates.hpp index aadacd1d9..3cefdee27 100644 --- a/Tensile/Source/lib/include/Tensile/Serialization/ContractionPredicates.hpp +++ b/Tensile/Source/lib/include/Tensile/Serialization/ContractionPredicates.hpp @@ -75,6 +75,8 @@ namespace Tensile Base::template Pair(), Base::template Pair(), Base::template Pair(), + Base::template Pair(), + Base::template Pair(), Base::template Pair(), Base::template Pair(), Base::template Pair(), @@ -226,6 +228,18 @@ namespace Tensile { }; + template + struct MappingTraits + : public AutoMappingTraits + { + }; + + template + struct MappingTraits + : public AutoMappingTraits + { + }; + template struct MappingTraits : public AutoMappingTraits diff --git a/Tensile/Source/lib/source/ContractionProblem.cpp b/Tensile/Source/lib/source/ContractionProblem.cpp index 8c3f409e8..e42bfaf51 100644 --- a/Tensile/Source/lib/source/ContractionProblem.cpp +++ b/Tensile/Source/lib/source/ContractionProblem.cpp @@ -706,6 +706,7 @@ namespace Tensile m_beta); // Set enum using beta to potentially allow for faster solutions consistencyCheck(); normalize(); + calcArithmeticIntensity(); } size_t ContractionProblem::toAPos(size_t idx) const @@ -1048,6 +1049,42 @@ namespace Tensile TENSILE_ASSERT_EXC(DataTypeInfo::Get(m_d.dataType()).isComplex); } + void ContractionProblem::calcArithmeticIntensity() + { + size_t problemSize = 1; + for(size_t i = 0; i < m_problemSizes.size(); ++i) + { + problemSize *= m_problemSizes[i]; + } + double gflop = 2 * problemSize * 1e-9; + + size_t aSize = 1; + for(size_t i = 0; i < m_a.dimensions(); ++i) + { + aSize *= m_a.sizes()[i]; + } + size_t bSize = 1; + for(size_t i = 0; i < m_b.dimensions(); ++i) + { + bSize *= m_b.sizes()[i]; + } + size_t cSize = 1; + for(size_t i = 0; i < m_c.dimensions(); ++i) + { 
+ cSize *= m_c.sizes()[i]; + } + if(m_beta != 0) // If problem includes beta, update gflops and gbytes + { + gflop += 2 * cSize * 1e-9; // Include (+ beta * C) in gflops + cSize *= 2; // Include read C and write D in gbytes + } + double gbyte + = (aSize * m_a.elementBytes() + bSize * m_b.elementBytes() + cSize * m_c.elementBytes()) + * 1e-9; + + m_arithmeticIntensity = gflop / gbyte; + } + size_t ContractionProblem::freeSizeA(size_t idx) const { return m_freeSizesA.at(idx); From 614893f7976459e4d5a75bfd5f1339f2b665cd44 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Sat, 27 Jan 2024 01:11:44 +0900 Subject: [PATCH 42/51] Skip DTV, DTL, LSU+MFMA tests for gfx908 (#1873) --- .../extended/direct_to_lds/dtl_hgemm.yaml | 2 +- .../extended/direct_to_lds/dtl_sgemm.yaml | 2 +- .../direct_to_lds/dtl_tsgr_hgemm.yaml | 2 +- .../direct_to_lds/dtl_tsgr_sgemm.yaml | 2 +- .../extended/direct_to_vgpr/dtv_hgemm.yaml | 2 +- .../extended/direct_to_vgpr/dtv_igemm.yaml | 2 +- .../local_split_u/cgemm_lsu_mfma.yaml | 4 ++-- .../local_split_u/hgemm_lsu_mfma.yaml | 6 +++--- .../local_split_u/hgemm_lsu_mfma_a1b0.yaml | 2 +- .../local_split_u/igemm_lsu_mfma.yaml | 20 +++++++++---------- .../local_split_u/sgemm_lsu_mfma.yaml | 10 +++++----- 11 files changed, 27 insertions(+), 27 deletions(-) diff --git a/Tensile/Tests/extended/direct_to_lds/dtl_hgemm.yaml b/Tensile/Tests/extended/direct_to_lds/dtl_hgemm.yaml index 118a86f7a..50eff564a 100644 --- a/Tensile/Tests/extended/direct_to_lds/dtl_hgemm.yaml +++ b/Tensile/Tests/extended/direct_to_lds/dtl_hgemm.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: 
NumElementsToValidate: -1 diff --git a/Tensile/Tests/extended/direct_to_lds/dtl_sgemm.yaml b/Tensile/Tests/extended/direct_to_lds/dtl_sgemm.yaml index 700bfb4e3..394eeb1aa 100644 --- a/Tensile/Tests/extended/direct_to_lds/dtl_sgemm.yaml +++ b/Tensile/Tests/extended/direct_to_lds/dtl_sgemm.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 diff --git a/Tensile/Tests/extended/direct_to_lds/dtl_tsgr_hgemm.yaml b/Tensile/Tests/extended/direct_to_lds/dtl_tsgr_hgemm.yaml index 449b59a2d..9d8426550 100644 --- a/Tensile/Tests/extended/direct_to_lds/dtl_tsgr_hgemm.yaml +++ b/Tensile/Tests/extended/direct_to_lds/dtl_tsgr_hgemm.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 diff --git a/Tensile/Tests/extended/direct_to_lds/dtl_tsgr_sgemm.yaml b/Tensile/Tests/extended/direct_to_lds/dtl_tsgr_sgemm.yaml index c11e3b07e..7257efac7 100644 --- a/Tensile/Tests/extended/direct_to_lds/dtl_tsgr_sgemm.yaml +++ b/Tensile/Tests/extended/direct_to_lds/dtl_tsgr_sgemm.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, 
skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 diff --git a/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml b/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml index 7fe9b0028..5cd2ea016 100644 --- a/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml +++ b/Tensile/Tests/extended/direct_to_vgpr/dtv_hgemm.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 diff --git a/Tensile/Tests/extended/direct_to_vgpr/dtv_igemm.yaml b/Tensile/Tests/extended/direct_to_vgpr/dtv_igemm.yaml index b8d26d029..f29b9103b 100644 --- a/Tensile/Tests/extended/direct_to_vgpr/dtv_igemm.yaml +++ b/Tensile/Tests/extended/direct_to_vgpr/dtv_igemm.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx940, skip-gfx941, skip-gfx942, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx940, skip-gfx941, skip-gfx942, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 diff --git a/Tensile/Tests/extended/local_split_u/cgemm_lsu_mfma.yaml b/Tensile/Tests/extended/local_split_u/cgemm_lsu_mfma.yaml index 162a827a4..44693d58a 100644 --- a/Tensile/Tests/extended/local_split_u/cgemm_lsu_mfma.yaml +++ b/Tensile/Tests/extended/local_split_u/cgemm_lsu_mfma.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not 
supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 @@ -112,7 +112,7 @@ BenchmarkProblems: #- AssertFree1ElementMultiple: [1,2] - PrefetchLocalRead: [3,5,9] - GlobalSplitU: [1,4] - - GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - GlobalSplitUAlgorithm: ["SingleBuffer"]#["SingleBuffer","MultipleBuffer"] - DepthU: [16]#[16,32]#[ 8, 16 ] #- StoreVectorWidth: [1,2] - VectorWidth: [1,2] diff --git a/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma.yaml b/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma.yaml index 724b5fbfe..f04cbf8c7 100644 --- a/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma.yaml +++ b/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 @@ -148,7 +148,7 @@ BenchmarkProblems: - AssertSummationElementMultiple: [2] - DepthU: [32,64,128]#[8,16,32] - GlobalSplitU: [1,4] - - GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - GlobalSplitUAlgorithm: ["SingleBuffer"]#["SingleBuffer","MultipleBuffer"] - 1LDSBuffer: [0] - LoopTail: [True] - OptNoLoadLoop: [1] @@ -216,7 +216,7 @@ BenchmarkProblems: - AssertSummationElementMultiple: [2] - DepthU: [32,64,128]#[8,16,32] - GlobalSplitU: [1,4] - #- GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - GlobalSplitUAlgorithm: ["SingleBuffer"]#["SingleBuffer","MultipleBuffer"] - 1LDSBuffer: [0] - LoopTail: [True] - OptNoLoadLoop: [1] diff --git 
a/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma_a1b0.yaml b/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma_a1b0.yaml index 519e9d3a5..18a0c0558 100644 --- a/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma_a1b0.yaml +++ b/Tensile/Tests/extended/local_split_u/hgemm_lsu_mfma_a1b0.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 diff --git a/Tensile/Tests/extended/local_split_u/igemm_lsu_mfma.yaml b/Tensile/Tests/extended/local_split_u/igemm_lsu_mfma.yaml index fcf44d03d..5c8338764 100644 --- a/Tensile/Tests/extended/local_split_u/igemm_lsu_mfma.yaml +++ b/Tensile/Tests/extended/local_split_u/igemm_lsu_mfma.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx940, skip-gfx941, skip-gfx942, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx940, skip-gfx941, skip-gfx942, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 @@ -54,7 +54,7 @@ BenchmarkProblems: - AssertSummationElementMultiple: [2] - DepthU: [32,64,128]#[8,16,32] - GlobalSplitU: [1,4] - #- GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - GlobalSplitUAlgorithm: ["SingleBuffer"]#["SingleBuffer","MultipleBuffer"] - 1LDSBuffer: [0] - LoopTail: [True] - OptNoLoadLoop: [1] @@ -124,7 +124,7 @@ BenchmarkProblems: - UseSgprForGRO: [0] #- BufferLoad: [0,1] #- BufferStore: [0,1] - - VgprForLocalReadPacking: [0,1] + - VgprForLocalReadPacking: [1]#[0,1] - ClusterLocalRead: 
[0,1] BenchmarkJoinParameters: BenchmarkFinalParameters: @@ -229,7 +229,7 @@ BenchmarkProblems: - AssertSummationElementMultiple: [2] - DepthU: [32,64,128]#[8,16,32] - GlobalSplitU: [1,4] - #- GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - GlobalSplitUAlgorithm: ["SingleBuffer"]#["SingleBuffer","MultipleBuffer"] - 1LDSBuffer: [0] - LoopTail: [True] - OptNoLoadLoop: [1] @@ -249,7 +249,7 @@ BenchmarkProblems: #- BufferLoad: [0,1] #- BufferStore: [0,1] - TransposeLDS: [1] - - LocalReadVectorWidth: [-1,8] + - LocalReadVectorWidth: [-1]#[-1,8] BenchmarkJoinParameters: BenchmarkFinalParameters: - ProblemSizes: @@ -285,7 +285,7 @@ BenchmarkProblems: - AssertSummationElementMultiple: [2] - DepthU: [32,64,128]#[8,16,32] - GlobalSplitU: [1,4] - #- GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - GlobalSplitUAlgorithm: ["SingleBuffer"]#["SingleBuffer","MultipleBuffer"] - 1LDSBuffer: [0] - LoopTail: [True] - OptNoLoadLoop: [1] @@ -305,9 +305,9 @@ BenchmarkProblems: #- BufferLoad: [0,1] #- BufferStore: [0,1] - TransposeLDS: [1] - - LocalReadVectorWidth: [-1,8] + - LocalReadVectorWidth: [-1]#[-1,8] - DirectToVgprB: [0,1] - - VgprForLocalReadPacking: [0,1] + - VgprForLocalReadPacking: [1]#[0,1] - ClusterLocalRead: [0,1] BenchmarkJoinParameters: BenchmarkFinalParameters: @@ -360,7 +360,7 @@ BenchmarkProblems: - AssertSummationElementMultiple: [2] - DepthU: [32,64,128]#[8,16,32] - GlobalSplitU: [1,4] - #- GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - GlobalSplitUAlgorithm: ["SingleBuffer"]#["SingleBuffer","MultipleBuffer"] - 1LDSBuffer: [0] - LoopTail: [True] - OptNoLoadLoop: [1] @@ -380,7 +380,7 @@ BenchmarkProblems: #- BufferLoad: [0,1] #- BufferStore: [0,1] - TransposeLDS: [1] - - LocalReadVectorWidth: [-1,8] + - LocalReadVectorWidth: [-1]#[-1,8] BenchmarkJoinParameters: BenchmarkFinalParameters: - ProblemSizes: diff --git a/Tensile/Tests/extended/local_split_u/sgemm_lsu_mfma.yaml b/Tensile/Tests/extended/local_split_u/sgemm_lsu_mfma.yaml 
index 3a0fc9e25..eea612abe 100644 --- a/Tensile/Tests/extended/local_split_u/sgemm_lsu_mfma.yaml +++ b/Tensile/Tests/extended/local_split_u/sgemm_lsu_mfma.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 @@ -93,7 +93,7 @@ BenchmarkProblems: - [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI - DepthU: [16,32] - GlobalSplitU: [1,4] - - GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - GlobalSplitUAlgorithm: ["SingleBuffer"]#["SingleBuffer","MultipleBuffer"] - GlobalSplitUWorkGroupMappingRoundRobin: [False] - GlobalSplitUSummationAssignmentRoundRobin: [True] - 1LDSBuffer: [0] @@ -146,7 +146,7 @@ BenchmarkProblems: - [ 64, 1, 4 ] # only WG2 is effective for 9 parameter MI - DepthU: [16] - GlobalSplitU: [1,4] - #- GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] + - GlobalSplitUAlgorithm: ["MultipleBuffer"]#["SingleBuffer","MultipleBuffer"] #- GlobalSplitUWorkGroupMappingRoundRobin: [False] #- GlobalSplitUSummationAssignmentRoundRobin: [True] - 1LDSBuffer: [0] @@ -329,8 +329,8 @@ BenchmarkProblems: - DepthU: [16,32] #- GlobalSplitU: [1,2] #- GlobalSplitUAlgorithm: ["SingleBuffer","MultipleBuffer"] - - GlobalSplitUWorkGroupMappingRoundRobin: [False] - - GlobalSplitUSummationAssignmentRoundRobin: [True] + #- GlobalSplitUWorkGroupMappingRoundRobin: [False] + #- GlobalSplitUSummationAssignmentRoundRobin: [True] - 1LDSBuffer: [0] - LdsBlockSizePerPadA: [-1] - LdsBlockSizePerPadB: [-1] From 5d20869a31332ea2f4a100dadf568518ba108e66 Mon Sep 17 00:00:00 2001 From: mahmoodw <44450175+mahmoodw@users.noreply.github.com> Date: Mon, 29 Jan 2024 10:39:57 -0700 Subject: [PATCH 43/51] Adding option of 
rotating buffers for timing with cache eviction (#1848) --------- Co-authored-by: mahmoodw --- Tensile/ClientWriter.py | 2 + Tensile/Common.py | 23 ++++ Tensile/Source/client/main.cpp | 116 ++++++++++++++++--- Tensile/Source/lib/include/Tensile/Utils.hpp | 21 ++++ Tensile/Tests/pre_checkin/sgemm_asm_nn.yaml | 1 + Tensile/Tests/pre_checkin/sgemm_asm_nt.yaml | 1 + 6 files changed, 146 insertions(+), 18 deletions(-) diff --git a/Tensile/ClientWriter.py b/Tensile/ClientWriter.py index 49f8a2461..3414a818f 100644 --- a/Tensile/ClientWriter.py +++ b/Tensile/ClientWriter.py @@ -451,6 +451,8 @@ def param(key, value): param("num-syncs-per-benchmark", globalParameters["SyncsPerBenchmark"]) param("use-gpu-timer", globalParameters["KernelTime"]) param("hardware-monitor", globalParameters["HardwareMonitor"]) + param("flush-count", globalParameters["FlushCount"]) + param("flush-memory-size", globalParameters["FlushMemorySize"]) if convValidation: param("convolution-vs-contraction", globalParameters["ConvolutionVsContraction"]) param("sleep-percent", globalParameters["SleepPercent"]) diff --git a/Tensile/Common.py b/Tensile/Common.py index 50fb00465..0d957c9ce 100644 --- a/Tensile/Common.py +++ b/Tensile/Common.py @@ -69,6 +69,29 @@ globalParameters["SyncsPerBenchmark"] = 1 # how iterations of the stream synchronization for-loop to do per benchmark data point globalParameters["EnqueuesPerSync"] = 1 # how many solution enqueues to perform per synchronization globalParameters["SleepPercent"] = 300 # how long to sleep after every data point: 25 means 25% of solution time. Sleeping lets gpu cool down more. +globalParameters["FlushCount"] = 1 # Number of copies of arrays to allocate for cache flushing in timing code. + # Functions are called iters times in a timing loop. + # If the problem memory footprint is small enough, then arrays will be cached. + # flush_count can be used to prevent caching. 
+ # For example, for sgemm with transA=transB=N: + # problem_memory_footprint = (m*k + k*n + m*n) * sizeof(float). + # To flush arrays before reusing set: + # flush_count >= 1 + cache_size / problem_memory_footprint + # Note that in the calculation of flush_count any padding from leading + # dimensions are not loaded to cache and not included in the problem_memory_footprint. + # If you specify flush_count you cannot also specify flush_memory_size) +globalParameters["FlushMemorySize"] = 0 # Bytes of memory that will be occupied by arrays. Used only in timing code for cache flushing. Set to greater than + # cache size, so that arrays are flushed from cache before they are reused. When the size of arrays (the problem_memory_footprint) + # is smaller than flush_memory_size, then flush_count copies of arrays are allocated where: + # flush_count = flush_memory_size / problem_memory_footprint. + # For sgemm with transA=transB=N + # problem_memory_footprint = (m*k + k*n + m*n) * sizeof(float). Note that any padding from leading + # dimensions are not loaded to cache and not included in the problem_memory_footprint. + # If you specify flush_memory_size you cannot also specify flush_count) + # Also note that Tensile allocates enough memory once at setup to accommodate + # the largest problem. Similarly, the largest problem will be used to calculate flush_count. 
+ # Configs with largely contrasting sizes may not guarantee cache eviction for the smaller problems + # validation globalParameters["NumElementsToValidate"] = 128 # number of elements to validate, 128 will be evenly spaced out (with prime number stride) across C tensor globalParameters["BoundsCheck"] = 0 # Bounds check diff --git a/Tensile/Source/client/main.cpp b/Tensile/Source/client/main.cpp index dd1f0641a..792db82b2 100644 --- a/Tensile/Source/client/main.cpp +++ b/Tensile/Source/client/main.cpp @@ -166,6 +166,28 @@ namespace Tensile ("use-gpu-timer", po::value()->default_value(true), "Use GPU timer") ("sleep-percent", po::value()->default_value(0), "Sleep percentage") ("hardware-monitor", po::value()->default_value(true), "Use hardware monitor.") + ("flush-count", po::value()->default_value(1), "Number of copies of arrays to allocate for cache flushing in timing code." + " Functions are called iters times in a timing loop." + " If the problem memory footprint is small enough, then arrays will be cached." + " flush_count can be used to prevent caching." + " For example, for sgemm with transA=transB=N:" + " problem_memory_footprint = (m*k + k*n + m*n) * sizeof(float)." + " To flush arrays before reusing set:" + " flush_count >= 1 + cache_size / problem_memory_footprint" + " Note that in the calculation of flush_count any padding from leading" + " dimensions are not loaded to cache and not included in the problem_memory_footprint." + " If you specify flush_count you cannot also specify flush_memory_size") + ("flush-memory-size", po::value()->default_value(0), "Used only in timing code for cache flushing. Set to greater than" + " cache size, so that arrays are flushed from cache before they are reused. When the size of arrays (the problem_memory_footprint)" + " is smaller than flush_memory_size, then flush_count copies of arrays are allocated where:" + " flush_count = flush_memory_size / problem_memory_footprint." 
+ " For sgemm with transA=transB=N" + " problem_memory_footprint = (m*k + k*n + m*n) * sizeof(float). Note that any padding from leading" + " dimensions are not loaded to cache and not included in the problem_memory_footprint." + " If you specify flush_memory_size you cannot also specify flush_count." + " Also note that Tensile allocates enough memory once at setup to accommodate" + " the largest problem. Similarly, the largest problem will be used to calculate flush_count." + " Configs with largely contrasting sizes may not guarantee cache eviction for the smaller problems") ("perf-l2-read-hits", po::value()->default_value(0.0), "L2 read hits") ("perf-l2-write-hits", po::value()->default_value(0.5), "L2 write hits") @@ -470,6 +492,48 @@ namespace Tensile } // namespace Client } // namespace Tensile +size_t calculate_flush_count(size_t arg_flush_count, + size_t arg_flush_memory_size, + Tensile::Client::ClientProblemFactory const& problemFactory) +{ + size_t default_arg_flush_count = 1; + size_t default_arg_flush_memory_size = 0; + size_t flush_count = default_arg_flush_count; + + size_t cached_size = 0; + + for(auto const& problem : problemFactory.problems()) + cached_size = std::max( + cached_size, + problem.a().sizes()[0] * problem.a().sizes()[1] * problem.a().elementBytes() + + problem.b().sizes()[0] * problem.b().sizes()[1] * problem.b().elementBytes() + + problem.c().sizes()[0] * problem.c().sizes()[1] * problem.c().elementBytes()); + + if(arg_flush_count != default_arg_flush_count + && arg_flush_memory_size != default_arg_flush_memory_size) + { + std::cout << "Tensile WARNING: cannot set both flush_count and flush_memory_size" + << std::endl; + std::cout << "Tensile WARNING: using flush_count = " << arg_flush_count << std::endl; + flush_count = arg_flush_count; + } + else if(arg_flush_count != default_arg_flush_count) + { + flush_count = arg_flush_count; + + std::cout << "flush_memory_size = "; + Tensile::print_memory_size(flush_count * cached_size); + 
std::cout << std::endl; + } + else if(arg_flush_memory_size != default_arg_flush_memory_size) + { + flush_count = 1 + (arg_flush_memory_size - 1) / cached_size; + + std::cout << "flush_count = " << flush_count << std::endl; + } + return flush_count; +} + int main(int argc, const char* argv[]) { using namespace Tensile; @@ -522,20 +586,28 @@ int main(int argc, const char* argv[]) size_t maxWorkspaceSizeLimit = args["max-workspace-size"].as(); size_t maxWorkspaceSize = getMaxWorkspace(library, hardware, args, problems, firstProblemIdx, lastProblemIdx); - maxWorkspaceSize = std::min(maxWorkspaceSize, maxWorkspaceSizeLimit); - - auto dataInit = DataInitialization::Get(args, problemFactory, maxWorkspaceSize); + maxWorkspaceSize = std::min(maxWorkspaceSize, maxWorkspaceSizeLimit); + size_t flush_count = args["flush-count"].as(); + size_t flush_memory_size = args["flush-memory-size"].as(); + std::vector> dataInit; auto solutionIterator = SolutionIterator::Default(library, hardware, args); MetaRunListener listeners; - listeners.addListener(dataInit); + flush_count = calculate_flush_count(flush_count, flush_memory_size, problemFactory); + + for(size_t i = 0; i < flush_count; i++) + { + dataInit.push_back(DataInitialization::Get(args, problemFactory, maxWorkspaceSize)); + listeners.addListener(dataInit[i]); + } + listeners.addListener(solutionIterator); listeners.addListener(std::make_shared(args)); if(runKernels) { - listeners.addListener(std::make_shared(args, dataInit)); + listeners.addListener(std::make_shared(args, dataInit[0])); listeners.addListener(std::make_shared(args, *hardware)); listeners.addListener(std::make_shared(args)); } @@ -572,7 +644,7 @@ int main(int argc, const char* argv[]) for(int problemIdx = firstProblemIdx; problemIdx <= lastProblemIdx; problemIdx++) { auto& problem = problems[problemIdx]; - problem.setWorkspaceSize(dataInit->workspaceSize()); + problem.setWorkspaceSize(dataInit[0]->workspaceSize()); reporters->report(ResultKey::ProblemIndex, 
problemIdx); reporters->report(ResultKey::ProblemProgress, @@ -599,12 +671,17 @@ int main(int argc, const char* argv[]) { while(listeners.needMoreRunsInSolution()) { - auto inputs = dataInit->prepareGPUInputs(problem); - - auto kernels = solution->solve(problem, *inputs, *hardware); + std::vector> inputs; + std::vector> kernels; + for(size_t i = 0; i < flush_count; i++) + { + inputs.push_back(dataInit[i]->prepareGPUInputs(problem)); + kernels.push_back( + solution->solve(problem, *(inputs[i]), *hardware)); + } size_t warmupInvocations = listeners.numWarmupRuns(); - size_t eventCount = gpuTimer ? kernels.size() : 0; + size_t eventCount = gpuTimer ? kernels[0].size() : 0; TimingEvents warmupStartEvents(warmupInvocations, eventCount); TimingEvents warmupStopEvents(warmupInvocations, eventCount); @@ -612,18 +689,18 @@ int main(int argc, const char* argv[]) { listeners.preWarmup(); if(gpuTimer) - HIP_CHECK_EXC(adapter.launchKernels(kernels, + HIP_CHECK_EXC(adapter.launchKernels(kernels[0], stream, warmupStartEvents[i], warmupStopEvents[i])); else - HIP_CHECK_EXC( - adapter.launchKernels(kernels, stream, nullptr, nullptr)); + HIP_CHECK_EXC(adapter.launchKernels( + kernels[0], stream, nullptr, nullptr)); listeners.postWarmup(); // Do validation after first warmup if(i == 0) listeners.validateWarmups( - inputs, warmupStartEvents, warmupStopEvents); + inputs[0], warmupStartEvents, warmupStopEvents); } size_t syncs = listeners.numSyncs(); @@ -640,16 +717,19 @@ int main(int argc, const char* argv[]) for(int j = 0; j < enq; j++) { + int flush_index = (j + i * enq + 1) % flush_count; if(gpuTimer) - HIP_CHECK_EXC(adapter.launchKernels( - kernels, stream, startEvents[j], stopEvents[j])); + HIP_CHECK_EXC(adapter.launchKernels(kernels[flush_index], + stream, + startEvents[j], + stopEvents[j])); else HIP_CHECK_EXC(adapter.launchKernels( - kernels, stream, nullptr, nullptr)); + kernels[flush_index], stream, nullptr, nullptr)); } listeners.postEnqueues(startEvents, stopEvents); - 
listeners.validateEnqueues(inputs, startEvents, stopEvents); + listeners.validateEnqueues(inputs[0], startEvents, stopEvents); } listeners.postSyncs(); diff --git a/Tensile/Source/lib/include/Tensile/Utils.hpp b/Tensile/Source/lib/include/Tensile/Utils.hpp index 024f43098..4f65761e3 100644 --- a/Tensile/Source/lib/include/Tensile/Utils.hpp +++ b/Tensile/Source/lib/include/Tensile/Utils.hpp @@ -29,6 +29,7 @@ #include #include #include +#include #include #include #include @@ -188,6 +189,26 @@ namespace Tensile return concatenate(std::forward(vals)...); } + inline void print_memory_size(size_t memory_size) + { + if(memory_size < 1024) + { + std::cout << std::setprecision(0) << memory_size << " Bytes"; + } + else if(memory_size < 1048576) + { + std::cout << std::setprecision(3) << float(memory_size) / 1024.0f << " KB"; + } + else if(memory_size < 1073741824) + { + std::cout << std::setprecision(6) << float(memory_size) / 1048576.0f << " MB"; + } + else + { + std::cout << std::setprecision(9) << float(memory_size) / 1073741824.0f << " GB"; + } + } + class StreamRead { public: diff --git a/Tensile/Tests/pre_checkin/sgemm_asm_nn.yaml b/Tensile/Tests/pre_checkin/sgemm_asm_nn.yaml index 73daf674f..a52d8c530 100644 --- a/Tensile/Tests/pre_checkin/sgemm_asm_nn.yaml +++ b/Tensile/Tests/pre_checkin/sgemm_asm_nn.yaml @@ -20,6 +20,7 @@ GlobalParameters: DataInitTypeAB: 3 DataInitTypeC: 3 KernelTime: True + FlushCount: 10 BenchmarkProblems: diff --git a/Tensile/Tests/pre_checkin/sgemm_asm_nt.yaml b/Tensile/Tests/pre_checkin/sgemm_asm_nt.yaml index 131c18955..55bd3d49f 100644 --- a/Tensile/Tests/pre_checkin/sgemm_asm_nt.yaml +++ b/Tensile/Tests/pre_checkin/sgemm_asm_nt.yaml @@ -20,6 +20,7 @@ GlobalParameters: DataInitTypeAB: 3 DataInitTypeC: 3 KernelTime: True + FlushMemorySize: 1000000 BenchmarkProblems: From 01a75361782babf640fc34ed12ee24974a19706e Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Sat, 3 Feb 2024 00:00:37 +0900 
Subject: [PATCH 44/51] fix rocblas build fail on gfx11 (#1876) - use state["ISA"] for reject conditions instead of globalParameters["CurrentISA"] --- Tensile/SolutionStructs.py | 12 +++++++----- 1 file changed, 7 insertions(+), 5 deletions(-) diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index c84b1b4b3..122f79301 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -2188,6 +2188,7 @@ def setGlobalLoadTileDimClassic(state, tc, numLoads, totalVectorsCoalesced, tota # flexibility in the unroll factors for example. @staticmethod def setGlobalLoadTileDimFractional(state, tc, depthU, glvwOrig): + isa = tuple(state["ISA"]) assert(depthU > 0) dbFract = 0 @@ -2213,10 +2214,10 @@ def setGlobalLoadTileDimFractional(state, tc, depthU, glvwOrig): # and a possible opportunity to handle the lsc grvw = glvwOrig minGrvw = 2 if state["ProblemType"]["DataType"].isHalf() and \ - globalParameters["ArchCaps"][globalParameters["CurrentISA"]]["HasEccHalf"] else 1 + globalParameters["ArchCaps"][isa]["HasEccHalf"] else 1 # TODO- check this for int8 and fractional load # minGrvw = 4 if state["ProblemType"]["DataType"].isInt8() and \ - # globalParameters["ArchCaps"][globalParameters["CurrentISA"]]["HasEccHalf"] else 1 + # globalParameters["ArchCaps"][isa]["HasEccHalf"] else 1 bestVw = -1 while grvw >= minGrvw: # Per instruction across the entire group: @@ -2430,6 +2431,7 @@ def checkAndAssignWaveSeparateGlobalRead(state, tc): # determine can we use VgprForLocalReadPacking @staticmethod def isVgprForLocalReadPackingDoable(state): + isa = tuple(state["ISA"]) rejectComment = "" doable = True # MatrixInstruction only @@ -2437,7 +2439,7 @@ def isVgprForLocalReadPackingDoable(state): rejectComment = "VgprForLocalReadPacking is for MatrixInstruction only" doable = False # only for HasEccHalf - if not globalParameters["ArchCaps"][globalParameters["CurrentISA"]]["HasEccHalf"]: + if not globalParameters["ArchCaps"][isa]["HasEccHalf"]: rejectComment = 
"VgprForLocalReadPacking is for EccHalf only" doable = False # only for SIA=3 + PLR>=1 @@ -3368,7 +3370,7 @@ def assignDerivedParameters(state): # Vector-width must be at least 2 for Half (since unroll loop uses packed operations?) if (not state["EnableMatrixInstruction"]) and state["VectorWidth"] < 2: reject(state, "VectorWidth must be >= 2 for half") - if globalParameters["ArchCaps"][globalParameters["CurrentISA"]]["HasEccHalf"]: + if globalParameters["ArchCaps"][isa]["HasEccHalf"]: if not state["ProblemType"]["HighPrecisionAccumulate"] and state["AssertFree0ElementMultiple"] % 2 != 0: # beta-on-edge has AF0EM requirement except for HPA kernels reject(state, "Archs with HasEccHalf require AF0EM%2==0 except for HPA kernels") @@ -3667,7 +3669,7 @@ def assignDerivedParameters(state): if validDepthU and state["KernelLanguage"] == "Assembly" \ and (state["ProblemType"]["DataType"].isHalf() \ or state["ProblemType"]["DataType"].isBFloat16()): - if globalParameters["ArchCaps"][globalParameters["CurrentISA"]]["HasEccHalf"]: + if globalParameters["ArchCaps"][isa]["HasEccHalf"]: if state["GlobalLoadVectorWidthA"] <= 1 or state["GlobalLoadVectorWidthB"] <= 1: reject(state, "HalfEcc requires GLVWA > 1") From 92ad5d743452b05951057beb3d5c964b2b0f3dbf Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Sat, 3 Feb 2024 01:13:26 +0900 Subject: [PATCH 45/51] skip sgemm 64bit offset tests for gfx94x (#1878) --- Tensile/Tests/pre_checkin/mfma/sgemm_64bit_offset.yaml | 2 +- Tensile/Tests/pre_checkin/mfma/sgemm_64bit_offset_post.yaml | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Tensile/Tests/pre_checkin/mfma/sgemm_64bit_offset.yaml b/Tensile/Tests/pre_checkin/mfma/sgemm_64bit_offset.yaml index ffe00f1c8..9cb1a3c31 100644 --- a/Tensile/Tests/pre_checkin/mfma/sgemm_64bit_offset.yaml +++ b/Tensile/Tests/pre_checkin/mfma/sgemm_64bit_offset.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, 
skip-gfx908, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx940, skip-gfx941, skip-gfx942, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 diff --git a/Tensile/Tests/pre_checkin/mfma/sgemm_64bit_offset_post.yaml b/Tensile/Tests/pre_checkin/mfma/sgemm_64bit_offset_post.yaml index a719dab85..a92a66909 100644 --- a/Tensile/Tests/pre_checkin/mfma/sgemm_64bit_offset_post.yaml +++ b/Tensile/Tests/pre_checkin/mfma/sgemm_64bit_offset_post.yaml @@ -1,5 +1,5 @@ TestParameters: - marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch + marks: [skip-gfx900, skip-gfx906, skip-gfx908, skip-gfx940, skip-gfx941, skip-gfx942, skip-gfx1010, skip-gfx1011, skip-gfx1012, skip-gfx1030, skip-gfx1100, skip-gfx1101, skip-gfx1102] # not supported by arch GlobalParameters: NumElementsToValidate: -1 From 6cc51b4bc885f5677b8bfc47005fd6741c0ad899 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Tue, 6 Feb 2024 02:00:24 +0900 Subject: [PATCH 46/51] Revert "Use fallback libraries for archs without optimized logic (#1862)" (#1879) This reverts commit efbe0c0caeedcf03776ae4e6a0067d88e38da211. 
--- Tensile/TensileCreateLibrary.py | 7 ------- 1 file changed, 7 deletions(-) diff --git a/Tensile/TensileCreateLibrary.py b/Tensile/TensileCreateLibrary.py index 58751082d..f28ba3119 100644 --- a/Tensile/TensileCreateLibrary.py +++ b/Tensile/TensileCreateLibrary.py @@ -940,18 +940,11 @@ def generateLogicDataAndSolutions(logicFiles, args): # logicData[problemType].append((scheduleName, deviceNames, \ # solutionsForSchedule, indexOrder, exactLogic, rangeLogic )) - (archs, _) = splitArchs() if globalParameters["SeparateArchitectures"] or globalParameters["LazyLibraryLoading"]: if "fallback" in masterLibraries.keys(): for key, value in masterLibraries.items(): if key != "fallback": value.merge(deepcopy(masterLibraries["fallback"])) - for archName in archs: - archName = archName.split('-', 1)[0] - if archName not in masterLibraries: - print1("Using fallback for arch: " + archName) - masterLibraries[archName] = deepcopy(masterLibraries["fallback"]) - masterLibraries[archName].version = args.version masterLibraries.pop("fallback") From 11c67dbc5bdcf55b06c3b4315d28f064ee90cc20 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Tue, 6 Feb 2024 06:14:27 +0900 Subject: [PATCH 47/51] fix mismatch issue with GlobalReadCoalesceGroup (#1875) - fixed mismatch issue with GlobalReadCoalesceGroup==0 + WaveSeparateGlobalRead - fixed mismatch issue with DirectToVgpr --- Tensile/KernelWriterAssembly.py | 15 ++++++++++----- Tensile/SolutionStructs.py | 11 +++-------- 2 files changed, 13 insertions(+), 13 deletions(-) diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index 1e74f5a47..c036b4ea6 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -4059,9 +4059,7 @@ def graTileAssignment(self, kernel, tP): divisorName = tP["lvp"] divisor = kernel[divisorName] - # force to swap gro-tile and gro-unroll for DirectToVgpr + TLU=False - forceSwap = (kernel["DirectToVgpr%s"%tc] and not 
tP["tlu"]) - if tP["grcg"] == tP["tlu"] or forceSwap: + if tP["grcg"] == tP["tlu"]: rReg = self.vgprPool.checkOut(1, "graTA rReg0", self.preventVgprOverflowDuringNewTile) # gro-tile = serial%divisor qReg = self.vgprPool.checkOut(1, "graTA qReg0", self.preventVgprOverflowDuringNewTile) # gro-unroll = serial/divisor tReg = rReg @@ -4102,6 +4100,13 @@ def graTileAssignment(self, kernel, tP): divisorVal //= kernel["ThreadSeparateGlobalRead%s"%tc] * 2 dividendReg = self.vgprPool.checkOut(1, "idInWave", self.preventVgprOverflowDuringNewTile) kStr += vectorStaticRemainder(dividendReg, "Serial", divisorVal, tmpSgpr) + # vgpr for WaveSeparateGlobalRead + add back to column index + if tP["tlu"]: + # tlu case, add wave offset to uReg + wqreg = uReg + else: + # no tlu case, add wave offset to tReg + wqreg = tReg # store DirectToVgpr K interval for later use dtvKInterval = 1 @@ -4217,7 +4222,7 @@ def graTileAssignment(self, kernel, tP): kStr += inst("s_lshr_b32", sgpr(tmpSgpr), sgpr(tmpSgpr), hex(log2(self.kernel["WavefrontSize"])), "WaveId") kStr += inst("s_mul_i32", sgpr(tmpSgpr), sgpr(tmpSgpr), (kernel["WavefrontSize"] // divisor), \ "Global Read Wave: each wave loads continuous WavefrontSize(%u)/divisor(%u) columns" % (kernel["WavefrontSize"], divisor)) - kStr += inst("_v_add_u32", vgpr(qReg), sgpr(tmpSgpr), vgpr(qReg), \ + kStr += inst("_v_add_u32", vgpr(wqreg), sgpr(tmpSgpr), vgpr(wqreg), \ "Global Read Wave: add back to column index") self.vgprPool.checkIn(dividendReg) @@ -4226,7 +4231,7 @@ def graTileAssignment(self, kernel, tP): kStr += inst("s_lshr_b32", sgpr(tmpSgpr), sgpr(tmpSgpr), hex(log2(kernel["WavefrontSize"])), "WaveId") kStr += inst("s_mul_i32", sgpr(tmpSgpr), sgpr(tmpSgpr), kernel[tP["lsp"]] * tP["nrp"], \ "Global Read Wave: each wave loads continuous lsp(%u)*nrp(%u) columns" % (kernel[tP["lsp"]], tP["nrp"])) - kStr += inst("_v_add_u32", vgpr(qReg), sgpr(tmpSgpr), vgpr(qReg), \ + kStr += inst("_v_add_u32", vgpr(wqreg), sgpr(tmpSgpr), vgpr(wqreg), \ "Global 
Read Wave: add back to column index") self.vgprPool.checkIn(dividendReg) diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index 122f79301..9a6392646 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -2588,6 +2588,9 @@ def isDirectToVgprDoable(state, tc): reject(state, "DirectToVgpr%c does not supports TLU = UnrollMajorLDS"%(tc)) return False + # force GlobalReadCoalesceGroup == TLU in DTV case + state["GlobalReadCoalesceGroup%s"%tc] = state["ProblemType"]["TLU%c"%tc] + # Does not work with DirectToLDS # -> this will be checked after DirectToLDS doable check is done @@ -3273,14 +3276,6 @@ def assignDerivedParameters(state): #print "staggerStrideShift=", staggerStrideShift, "depthu=", state["DepthU"] state["_staggerStrideShift"] = staggerStrideShift - # force GlobalReadCoalesceGroupA, B = True until we fix fail with trsm (TODO: re-enable) - if not state["GlobalReadCoalesceGroupA"]: - print2("GlobalReadCoalesceGroupA=False not supported for now. Force to True") - state["GlobalReadCoalesceGroupA"] = True - if not state["GlobalReadCoalesceGroupB"]: - print2("GlobalReadCoalesceGroupB=False not supported for now. 
Force to True") - state["GlobalReadCoalesceGroupB"] = True - # Use GlobalReadVectorWidth if it is not -1 if state["GlobalReadVectorWidth"] != -1: state["GlobalLoadVectorWidthA"] = state["GlobalReadVectorWidth"] From 5de0457ad4a5acd5b508a64c424387c11fb99acd Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Mon, 5 Feb 2024 18:01:01 -0700 Subject: [PATCH 48/51] Fix BufferLoad=False with stream-k (#1877) --- Tensile/KernelWriterAssembly.py | 20 ++++- .../extended/stream_k/sk_2tile_sgemm.yaml | 80 +++++++++++++++++++ 2 files changed, 98 insertions(+), 2 deletions(-) diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index c036b4ea6..c48d33f3a 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -5145,8 +5145,24 @@ def graAddresses(self, kernel, tP, isPap=False): #kStr += self.bomb(0x13) # after addresses and SRD set else: tmp = self.vgprPool.checkOut(2, "tmp", self.preventVgprOverflowDuringNewTile) - kStr += inst("v_mov_b32", vgpr(tmp+0), sgpr("Address%s+0"%tP["tensorChar"]), "" ) - kStr += inst("v_mov_b32", vgpr(tmp+1), sgpr("Address%s+1"%tP["tensorChar"]), "" ) + + if kernel["StreamK"]: + # StreamK partial tile - offset to tile start index + tmpOffset = self.sgprPool.checkOut(2, "skStartOffset", preventOverflow=0) + kStr += inst("s_mul_i32", sgpr(tmpOffset), sgpr("StreamKLocalStart"), "DepthU*%d"%(tP["bpe"]), "StreamK tile start offset") + strideL = self.strideRef(tc, kernel["ProblemType"]["IndicesSummation"][0]) + kStr += self.s_mul_u64_u32(sgpr(tmpOffset), sgpr(tmpOffset+1), sgpr(tmpOffset), strideL, "StreamK tile start offset") + if kernel["CheckDimOverflow"] >=2: + kStr += self.assert_eq(sgpr(tmpOffset+1),0) + kStr += inst("s_add_u32", sgpr(tmpOffset+0), sgpr(tmpOffset+0), sgpr("Address%s+0"%tP["tensorChar"]), "accum skOffset term to tilestart") + kStr += inst("s_addc_u32", sgpr(tmpOffset+1), sgpr(tmpOffset+1), sgpr("Address%s+1"%tP["tensorChar"]), "accum skOffset term to tilestart") + kStr += 
inst("v_mov_b32", vgpr(tmp+0), sgpr(tmpOffset+0), "" ) + kStr += inst("v_mov_b32", vgpr(tmp+1), sgpr(tmpOffset+1), "" ) + self.sgprPool.checkIn(tmpOffset) + else: + kStr += inst("v_mov_b32", vgpr(tmp+0), sgpr("Address%s+0"%tP["tensorChar"]), "" ) + kStr += inst("v_mov_b32", vgpr(tmp+1), sgpr("Address%s+1"%tP["tensorChar"]), "" ) + for perp in range(0, tP["nrp"]): for sPerp in range(0, tP["nrpv"]): for para in range(0, tP["nrc"]): diff --git a/Tensile/Tests/extended/stream_k/sk_2tile_sgemm.yaml b/Tensile/Tests/extended/stream_k/sk_2tile_sgemm.yaml index fd62b0f92..4b2b2bbac 100644 --- a/Tensile/Tests/extended/stream_k/sk_2tile_sgemm.yaml +++ b/Tensile/Tests/extended/stream_k/sk_2tile_sgemm.yaml @@ -111,3 +111,83 @@ BenchmarkProblems: - Exact: [ 4103, 4103, 3, 1024 ] - Exact: [ 4096, 4096, 3, 1031 ] - Exact: [ 4103, 4103, 3, 1031 ] + + - # BufferLoad False tests + InitialSolutionParameters: + BenchmarkCommonParameters: + - KernelLanguage: ["Assembly"] + - EdgeType: ["ShiftPtr"] + - PrefetchLocalRead: [True] + ForkParameters: + - MatrixInstruction: + # - [32, 32, 2, 1, 1, 2,2, 2,2] + # - [32, 32, 2, 1, 1, 3,3, 2,2] + - [32, 32, 2, 1, 1, 4,4, 2,2] + # - [32, 32, 2, 1, 1, 2,1, 2,2] + # - [32, 32, 2, 1, 1, 1,1, 2,2] + # - [16, 16, 4, 1, 1, 3,3, 2,2] + # - [16, 16, 4, 1, 1, 4,1, 2,2] + # - [16, 16, 4, 1, 1, 4,2, 2,2] + - [16, 16, 4, 1, 1, 4,4, 2,2] + # - [16, 16, 4, 1, 1, 8,8, 2,2] + # - [16, 16, 4, 1, 1, 2,2, 2,2] + # - [16, 16, 4, 1, 1, 2,1, 2,2] + # - [16, 16, 4, 1, 1, 1,1, 2,2] + - ThreadTile: + - [ 1, 32 ] + - WorkGroup: + - [ 16, 16, 1 ] + # - WorkGroupMapping: [0, 1, 2, 4, 8, 16, 32, 64] # works + - WorkGroupMapping: [0, 8] + - GlobalSplitU: [1] + - DepthU: [ 8 ] + - BufferLoad: [False] + # - DepthU: [ 8, 16, 32 ] + # - DepthU: [ 8, 12, 16, 32 ] + # - DepthU: [ 2, 4, 8, 16, 32, 64 ] + # - DepthU: [ 8, 9, 10, 11, 12, 13, 14, 15, 16 ] # depthu 14 failed a test + - VectorWidth: [1] + - StreamK: [3] + - StaggerU: [0, 32] + # - StaggerU: [0] + - ScheduleIterAlg: [3] + # 
- SourceSwap: [False, True] + - SourceSwap: [False] + # - ExpandPointerSwap: [False, True] + # - ExpandPointerSwap: [False] + - PrefetchLocalRead: [3, 5] + # - PrefetchLocalRead: [1, 3, 5, 9, 13, 17] + # - PrefetchLocalRead: [1, 9, 10, 11, 12, 13, 14, 15, 16, 17] + # - PrefetchGlobalRead: [1, 2] + - PrefetchGlobalRead: [1] + # - 1LDSBuffer: [0, 1] + # - 1LDSBuffer: [1] + # - EdgeType: ["Branch", "ShiftPtr"] + # - EdgeType: ["ShiftPtr"] + # - MIArchVgpr: [0, 1] + # - MIArchVgpr: [1] + # - StoreVectorWidth: [4, 1] + - StoreVectorWidth: [4] + # - NumElementsPerBatchStore: [0, 2, 4, 8] + # - NumElementsPerBatchStore: [8] + # - AssertAlphaValue: [1] + + BenchmarkForkParameters: + JoinParameters: + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Exact: [ 512, 512, 1, 512 ] + - Exact: [ 4096, 4096, 1, 1024 ] + # - Exact: [ 4103, 4096, 1, 1024 ] + # - Exact: [ 4096, 4103, 1, 1024 ] + # - Exact: [ 4103, 4103, 1, 1024 ] + # - Exact: [ 4096, 4096, 1, 1031 ] + - Exact: [ 4103, 4103, 1, 1031 ] + - Exact: [ 512, 512, 3, 512 ] + - Exact: [ 4096, 4096, 3, 1024 ] + # - Exact: [ 4103, 4096, 3, 1024 ] + # - Exact: [ 4096, 4103, 3, 1024 ] + # - Exact: [ 4103, 4103, 3, 1024 ] + # - Exact: [ 4096, 4096, 3, 1031 ] + - Exact: [ 4103, 4103, 3, 1031 ] From 6dfe230027082e1bde705143c23e9a6494c493ae Mon Sep 17 00:00:00 2001 From: Alex Brown Date: Wed, 7 Feb 2024 10:49:46 -0700 Subject: [PATCH 49/51] Disable InitAccVgprOpt for Stream-K (#1880) --- Tensile/KernelWriter.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/Tensile/KernelWriter.py b/Tensile/KernelWriter.py index a2e490218..5e31fb5a2 100644 --- a/Tensile/KernelWriter.py +++ b/Tensile/KernelWriter.py @@ -4257,7 +4257,8 @@ def initKernel(self, kernel, tensorParametersA, tensorParametersB ): self.useInitAccVgprOpt = False # enable for the following conditions if kernel["EnableMatrixInstruction"] and (kernel["PrefetchGlobalRead"] == 1 or kernel["PrefetchGlobalRead"] == 2) \ - and 
globalParameters["AsmCaps"][globalParameters["CurrentISA"]]["HasMFMA_constSrc"]: + and globalParameters["AsmCaps"][globalParameters["CurrentISA"]]["HasMFMA_constSrc"] \ + and kernel["StreamK"] == 0: self.useInitAccVgprOpt = True # force to disable for the following conditions if self.useInitAccVgprOpt: From 8fdd9cdbb13d573431ccd30a1f560977939b4bce Mon Sep 17 00:00:00 2001 From: Scott Quiring <44450689+sdquiring@users.noreply.github.com> Date: Wed, 7 Feb 2024 11:36:12 -0700 Subject: [PATCH 50/51] Kernarg preloading (#1843) Kernarg preloading is OFF by default, it can be enabled if it's supported by the GPU/remaining kernel parameters. The kernel parameter DelayRemainingArguments specifies whether we should initiate the load of the remaining (non-preloaded) arguments at the beginning of the kernel or after we've initiated the first loads of A and B. This feature only supports a small set of kernel parameters. If it proves useful it might be possible to expand for example, only preload the A related arguments if we need some of the sizes. Other things that were changed: The ASM cap cache has been moved to its own file (AsmCaps.py). If the PrintLevel is >= 1 and the cache is out of date, the output will include what that file should now contain. The AsmRegisterPool now keeps track of which registers are arguments and which are preloaded This is used to generate the metadata in the signature. We should not be allocating registers for unused arguments and then immediately freeing them. This was always a potential bug but these changes caused this to create an actual problem The solution is to conditionally send these arguments in/allocate them. This is now the case and it should be maintained going forward. * Auto generate argument signature. * Update custom kernel to load args as they're sent in now. 
* Switch default value for PKA to 0, add -1 'auto' mode --- .jenkins/common.groovy | 2 +- Tensile/AsmCaps.py | 715 ++++++++++++++++++ Tensile/AsmRegisterPool.py | 212 ++++-- Tensile/Common.py | 59 +- Tensile/Components/Signature.py | 142 +--- Tensile/Contractions.py | 4 + ...128x16_MI16x16x4x1_GRVW2_SU4_SUS128_WGM4.s | 6 +- Tensile/KernelWriter.py | 4 +- Tensile/KernelWriterAssembly.py | 348 +++++---- Tensile/Parallel.py | 2 +- Tensile/SolutionStructs.py | 52 ++ .../include/Tensile/ContractionSolution.hpp | 1 + .../Serialization/ContractionSolution.hpp | 1 + .../Source/lib/source/ContractionSolution.cpp | 97 ++- .../lib/source/hip/HipSolutionAdapter.cpp | 6 - .../preload_kernel_arguments_always_half.yaml | 56 ++ ..._kernel_arguments_half_bfloat16_sgemm.yaml | 175 +++++ 17 files changed, 1475 insertions(+), 407 deletions(-) create mode 100644 Tensile/AsmCaps.py create mode 100644 Tensile/Tests/pre_checkin/preload_kernel_arguments_always_half.yaml create mode 100644 Tensile/Tests/pre_checkin/preload_kernel_arguments_half_bfloat16_sgemm.yaml diff --git a/.jenkins/common.groovy b/.jenkins/common.groovy index e24a645c4..32fb8d9f5 100644 --- a/.jenkins/common.groovy +++ b/.jenkins/common.groovy @@ -121,7 +121,7 @@ def runTestCommand (platform, project, jobName, test_marks, boolean skipHostTest String compiler = 'hipcc' String pythonVersion = 'py3' String markSkipHostTest = skipHostTest ? "#" : "" - String markSkipExtendedTest = !test_marks.contains("extended") ? "--gtest_filter=-\"*Extended*\"" : "" + String markSkipExtendedTest = !test_marks.contains("extended") ? 
"\"--gtest_filter=-*Extended*:*Ocl*\"" : "\"--gtest_filter=-*Ocl*\"" def command = """#!/usr/bin/env bash set -x diff --git a/Tensile/AsmCaps.py b/Tensile/AsmCaps.py new file mode 100644 index 000000000..fa61708b4 --- /dev/null +++ b/Tensile/AsmCaps.py @@ -0,0 +1,715 @@ +CACHED_ASM_CAPS = \ +{(0, 0, 0): {'HasAddLshl': False, + 'HasAtomicAdd': False, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': False, + 'HasExplicitCO': False, + 'HasExplicitNC': False, + 'HasGLCModifier': False, + 'HasLshlOr': False, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': False, + 'HasWMMA': False, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 0, + 'SupportedISA': False, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': False, + 'v_dot2_f32_f16': False, + 'v_dot2c_f32_f16': False, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': False, + 'v_fma_f16': False, + 'v_fma_f32': False, + 'v_fma_f64': False, + 'v_fma_mix_f32': False, + 'v_fmac_f16': False, + 'v_fmac_f32': False, + 'v_mac_f16': False, + 'v_mac_f32': False, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': False, + 'v_pk_fmac_f16': False}, + (8, 0, 3): {'HasAddLshl': False, + 'HasAtomicAdd': False, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': False, + 'HasExplicitNC': False, + 'HasGLCModifier': True, + 'HasLshlOr': False, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': False, + 'HasWMMA': False, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 15, + 'SupportedISA': 
True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': False, + 'v_dot2_f32_f16': False, + 'v_dot2c_f32_f16': False, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': False, + 'v_fma_f16': False, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': False, + 'v_fmac_f16': False, + 'v_fmac_f32': False, + 'v_mac_f16': True, + 'v_mac_f32': True, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': False, + 'v_pk_fmac_f16': False}, + (9, 0, 0): {'HasAddLshl': True, + 'HasAtomicAdd': False, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': False, + 'HasGLCModifier': True, + 'HasLshlOr': True, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': False, + 'v_dot2_f32_f16': False, + 'v_dot2c_f32_f16': False, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': False, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': False, + 'v_fmac_f16': False, + 'v_fmac_f32': False, + 'v_mac_f16': True, + 'v_mac_f32': True, + 'v_mad_mix_f32': True, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (9, 0, 6): {'HasAddLshl': True, + 'HasAtomicAdd': False, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': False, + 'HasGLCModifier': True, + 'HasLshlOr': True, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 
'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': True, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': False, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': False, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': True, + 'v_mac_f32': True, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (9, 0, 8): {'HasAddLshl': True, + 'HasAtomicAdd': True, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': False, + 'HasGLCModifier': True, + 'HasLshlOr': True, + 'HasMFMA': True, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': True, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': True, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': True, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': True, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': True, + 'v_mac_f32': True, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (9, 0, 10): {'HasAddLshl': True, + 'HasAtomicAdd': True, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': False, + 'HasGLCModifier': True, + 'HasLshlOr': True, + 'HasMFMA': True, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': True, + 'HasMFMA_bf16_original': True, + 'HasMFMA_constSrc': True, + 'HasMFMA_f64': True, + 'HasMFMA_f8': False, + 
'HasMFMA_i8_908': True, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': True, + 'HasMFMA_xf32': False, + 'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': True, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': True, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': True, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': True, + 'v_mac_f32': True, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (9, 4, 0): {'HasAddLshl': True, + 'HasAtomicAdd': True, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': False, + 'HasGLCModifier': False, + 'HasLshlOr': True, + 'HasMFMA': True, + 'HasMFMA_b8': True, + 'HasMFMA_bf16_1k': True, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': True, + 'HasMFMA_f64': True, + 'HasMFMA_f8': True, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': True, + 'HasMFMA_vgpr': True, + 'HasMFMA_xf32': True, + 'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': True, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': True, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': True, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': True, + 'v_mac_f32': False, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (9, 4, 1): {'HasAddLshl': True, + 'HasAtomicAdd': True, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': False, + 'HasGLCModifier': False, + 'HasLshlOr': True, + 'HasMFMA': True, + 'HasMFMA_b8': True, + 'HasMFMA_bf16_1k': True, + 
'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': True, + 'HasMFMA_f64': True, + 'HasMFMA_f8': True, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': True, + 'HasMFMA_vgpr': True, + 'HasMFMA_xf32': True, + 'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': True, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': True, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': True, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': True, + 'v_mac_f32': False, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (9, 4, 2): {'HasAddLshl': True, + 'HasAtomicAdd': True, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': False, + 'HasGLCModifier': False, + 'HasLshlOr': True, + 'HasMFMA': True, + 'HasMFMA_b8': True, + 'HasMFMA_bf16_1k': True, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': True, + 'HasMFMA_f64': True, + 'HasMFMA_f8': True, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': True, + 'HasMFMA_vgpr': True, + 'HasMFMA_xf32': True, + 'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': True, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': True, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': True, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': True, + 'v_mac_f32': False, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (10, 1, 0): {'HasAddLshl': True, + 'HasAtomicAdd': False, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': True, + 'HasGLCModifier': True, + 
'HasLshlOr': True, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': False, + 'v_dot2_f32_f16': False, + 'v_dot2c_f32_f16': False, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': False, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': False, + 'v_mac_f32': True, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (10, 1, 1): {'HasAddLshl': True, + 'HasAtomicAdd': False, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': True, + 'HasGLCModifier': True, + 'HasLshlOr': True, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': True, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': True, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': False, + 'v_mac_f32': True, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (10, 1, 2): {'HasAddLshl': True, + 'HasAtomicAdd': False, + 'HasDirectToLdsDest': False, + 
'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': True, + 'HasGLCModifier': True, + 'HasLshlOr': True, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': True, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': True, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': False, + 'v_mac_f32': True, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (10, 3, 0): {'HasAddLshl': True, + 'HasAtomicAdd': False, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': True, + 'HasGLCModifier': True, + 'HasLshlOr': True, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': True, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': True, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': False, + 'v_mac_f32': False, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 
'v_pk_fmac_f16': False}, + (10, 3, 1): {'HasAddLshl': True, + 'HasAtomicAdd': False, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': True, + 'HasExplicitCO': True, + 'HasExplicitNC': True, + 'HasGLCModifier': True, + 'HasLshlOr': True, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': True, + 'HasWMMA': False, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': True, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': True, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': False, + 'v_mac_f32': False, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (11, 0, 0): {'HasAddLshl': True, + 'HasAtomicAdd': True, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': False, + 'HasExplicitCO': True, + 'HasExplicitNC': True, + 'HasGLCModifier': True, + 'HasLshlOr': True, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': True, + 'HasWMMA': True, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': False, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': False, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 
'v_fmac_f32': True, + 'v_mac_f16': False, + 'v_mac_f32': False, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (11, 0, 1): {'HasAddLshl': True, + 'HasAtomicAdd': True, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': False, + 'HasExplicitCO': True, + 'HasExplicitNC': True, + 'HasGLCModifier': True, + 'HasLshlOr': True, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': True, + 'HasWMMA': True, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': False, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': False, + 'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': False, + 'v_mac_f32': False, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}, + (11, 0, 2): {'HasAddLshl': True, + 'HasAtomicAdd': True, + 'HasDirectToLdsDest': False, + 'HasDirectToLdsNoDest': False, + 'HasExplicitCO': True, + 'HasExplicitNC': True, + 'HasGLCModifier': True, + 'HasLshlOr': True, + 'HasMFMA': False, + 'HasMFMA_b8': False, + 'HasMFMA_bf16_1k': False, + 'HasMFMA_bf16_original': False, + 'HasMFMA_constSrc': False, + 'HasMFMA_f64': False, + 'HasMFMA_f8': False, + 'HasMFMA_i8_908': False, + 'HasMFMA_i8_940': False, + 'HasMFMA_vgpr': False, + 'HasMFMA_xf32': False, + 'HasSMulHi': True, + 'HasWMMA': True, + 'KernargPreloading': False, + 'MaxLgkmcnt': 15, + 'MaxVmcnt': 63, + 'SupportedISA': True, + 'SupportedSource': True, + 'VOP3v_dot4_i32_i8': False, + 'v_dot2_f32_f16': True, + 'v_dot2c_f32_f16': True, + 'v_dot4_i32_i8': False, + 'v_dot4c_i32_i8': False, + 
'v_fma_f16': True, + 'v_fma_f32': True, + 'v_fma_f64': True, + 'v_fma_mix_f32': True, + 'v_fmac_f16': False, + 'v_fmac_f32': True, + 'v_mac_f16': False, + 'v_mac_f32': False, + 'v_mad_mix_f32': False, + 'v_pk_fma_f16': True, + 'v_pk_fmac_f16': False}} diff --git a/Tensile/AsmRegisterPool.py b/Tensile/AsmRegisterPool.py index d1f53ec0a..ec5e166da 100644 --- a/Tensile/AsmRegisterPool.py +++ b/Tensile/AsmRegisterPool.py @@ -43,12 +43,16 @@ class Status(Enum): Unavailable = 0 Available = 1 InUse = 2 + AvailableForPreload = 3 class Register: def __init__(self, status, tag): self.status = status self.tag = tag + def __repr__(self) -> str: + return f"({self.status}, {self.tag})" + ######################################## # Init # defaultPreventOverflow: control behavior of checkout and checkoutAligned when preventOverflow is not explicitly specificed. @@ -57,8 +61,48 @@ def __init__(self, size, type, defaultPreventOverflow, printRP=0): self.type = type self.defaultPreventOverflow = defaultPreventOverflow self.pool = [self.Register(RegisterPool.Status.Unavailable, "init") for i in range(0,size)] + + # Map from register number -> size, deleted/overwritten when deallocated self.checkOutSize = {} + # Map from tag -> size, not deleted. 
+ self.checkOutSizeCache = {} + + # First register that's part of the manually loaded kernargs + self.kernargStart = None + # Last+1 register that's part of the manually loaded kernargs + self.kernargEnd = None + + # First register that's part of the preloaded kernargs + self.preloadStart = None + # Last+1 register that's part of the preloaded kernargs + self.preloadEnd = None + + # Each of the preloaded kernargs' name and size + self.preloadedKernargs = [] + # Each of the manually loaded kernargs' name and size + self.selfLoadedKernargs = [] + + + @property + def numKernargSGPRs(self): + if self.kernargStart is None: + assert self.kernargEnd is None + return 0 + return self.kernargEnd - self.kernargStart + + @property + def numPreloadSGPRs(self): + if self.preloadStart is None: + assert self.preloadEnd is None + return 0 + return self.preloadEnd - self.preloadStart + + @property + def kernargs(self): + from itertools import chain + return chain(self.preloadedKernargs, self.selfLoadedKernargs) + ######################################## # Adds registers to the pool so they can be used as temps # Convenience function that takes a range and returns it in string form @@ -72,7 +116,7 @@ def addRange(self, start, stop, tag=""): ######################################## # Adds registers to the pool so they can be used as temps # Add - def add(self, start, size, tag=""): + def add(self, start, size, tag="", newStatus=Status.Available): # reserve space if self.printRP: print("RP::add(%u..%u for '%s')"%(start,start+size-1,tag)) @@ -84,7 +128,7 @@ def add(self, start, size, tag=""): # mark as available for i in range(start, start+size): if self.pool[i].status == RegisterPool.Status.Unavailable: - self.pool[i].status = RegisterPool.Status.Available + self.pool[i].status = newStatus self.pool[i].tag = tag elif self.pool[i].status == RegisterPool.Status.Available: printWarning("RegisterPool::add(%u,%u) pool[%u](%s) already available" % (start, size, i, self.pool[i].tag)) @@ 
-121,79 +165,109 @@ def remove(self, start, size, tag=""): def checkOut(self, size, tag="_untagged_", preventOverflow=-1): return self.checkOutAligned(size, 1, tag, preventOverflow) - def checkOutAligned(self, size, alignment, tag="_untagged_aligned_", preventOverflow=-1): + def isRangeAvailable(self, start, size, preventOverflow=-1, wantedStatus=Status.Available) -> bool: + end = start + size if preventOverflow == -1: preventOverflow = self.defaultPreventOverflow - assert(size > 0) - found = -1 - for i in range(0, len(self.pool)): - # alignment + + if preventOverflow and end > len(self.pool): + return False + + end = min(end, len(self.pool)) + + for i in range(start, end): + if self.pool[i].status != wantedStatus: + return False + + return True + + def findFreeRange(self, size, alignment, preventOverflow=-1, wantedStatus=Status.Available): + if preventOverflow == -1: + preventOverflow = self.defaultPreventOverflow + + for i in range(len(self.pool)+1): if i % alignment != 0: continue - # enough space - if i + size > len(self.pool): - continue - # all available - allAvailable = True - for j in range(0, size): - if self.pool[i+j].status != RegisterPool.Status.Available: - allAvailable = False - i = j+1 - break - if allAvailable: - found = i - break - else: - continue + if self.isRangeAvailable(i, size, preventOverflow, wantedStatus): + return i - # success without overflowing - if found > -1: - #print "Found: %u" % found - for i in range(found, found+size): - self.pool[i].status = RegisterPool.Status.InUse - self.pool[i].tag = tag - self.checkOutSize[found] = size - if self.printRP: - print("RP::checkOut '%s' (%u,%u) @ %u avail=%u"%(tag, size,alignment, found, self.available())) - #print self.state() - return found - # need overflow + if preventOverflow: + return None else: - #print "RegisterPool::checkOutAligned(%u,%u) overflowing past %u" % (size, alignment, len(self.pool)) - # where does tail sequence of available registers begin - assert (not preventOverflow) - 
start = len(self.pool) - for i in range(len(self.pool)-1, 0, -1): - if self.pool[i].status == RegisterPool.Status.Available: - self.pool[i].tag = tag - start = i - continue - else: - break - #print "Start: ", start - # move forward for alignment - - start = roundUpToNearestMultiple(start,alignment) - #print "Aligned Start: ", start - # new checkout can begin at start - newSize = start + size - oldSize = len(self.pool) - overflow = newSize - oldSize - #print "Overflow: ", overflow - for i in range(start, len(self.pool)): - self.pool[i].status = RegisterPool.Status.InUse - self.pool[i].tag = tag - for i in range(0, overflow): - if len(self.pool) < start: - # this is padding to meet alignment requirements - self.pool.append(self.Register(RegisterPool.Status.Available,tag)) - else: - self.pool.append(self.Register(RegisterPool.Status.InUse,tag)) - self.checkOutSize[start] = size - if self.printRP: - print(self.state()) - print("RP::checkOut' %s' (%u,%u) @ %u (overflow)"%(tag, size, alignment, start)) - return start + loc = self.startOfLastAvailableBlock() + return roundUpToNearestMultiple(loc, alignment) + + def checkOutAt(self, start, size, tag, preventOverflow, wantedStatus = Status.Available): + if preventOverflow: + assert start + size <= len(self.pool) + + assert self.isRangeAvailable(start, size, preventOverflow, wantedStatus=wantedStatus) + + end = start + size + + numToAdd = max(0, end - len(self.pool)) + if numToAdd > 0: + self.add(len(self.pool), numToAdd) + + for i in range(start, end): + assert self.pool[i].status == wantedStatus + + for i in range(start, end): + self.pool[i].status = RegisterPool.Status.InUse + self.pool[i].tag = tag + self.checkOutSize[start] = size + self.checkOutSizeCache[tag] = size + + def startOfLastAvailableBlock(self) -> int: + """ Returns the index of the first available register in the highest-numbered free block of registers. 
""" + for i in range(len(self.pool)-1, 0, -1): + if self.pool[i].status != RegisterPool.Status.Available: + return i+1 + return len(self.pool) + + def checkOutAligned(self, size, alignment, tag="_untagged_aligned_", preventOverflow=-1, kernarg=False, preload=False): + if preventOverflow == -1: + preventOverflow = self.defaultPreventOverflow + assert size > 0 + + if kernarg: + assert not preventOverflow + entry = {"name": tag, "size": size} + if preload: + self.preloadedKernargs.append(entry) + else: + self.selfLoadedKernargs.append(entry) + + if preload: + loc = self.findFreeRange(size, alignment, True, RegisterPool.Status.AvailableForPreload) + if self.preloadStart is None: + assert loc == 2, "Assume that preloaded kernargs start at s2" + self.preloadStart = loc + else: + assert loc == self.preloadEnd + + self.preloadEnd = loc + size + assert loc is not None + self.checkOutAt(loc, size, tag, True, wantedStatus=RegisterPool.Status.AvailableForPreload) + return loc + + if kernarg: + assert not preventOverflow + if self.kernargStart is None: + loc = self.startOfLastAvailableBlock() + loc = roundUpToNearestMultiple(loc, alignment) + self.kernargStart = loc + else: + loc = roundUpToNearestMultiple(self.kernargEnd, alignment) + + self.kernargEnd = loc + size + self.checkOutAt(loc, size, tag, preventOverflow) + return loc + + loc = self.findFreeRange(size, alignment, preventOverflow) + assert loc is not None + self.checkOutAt(loc, size, tag, preventOverflow) + return loc def initTmps(self, initValue, start=0, stop=-1): kStr = "" diff --git a/Tensile/Common.py b/Tensile/Common.py index 0d957c9ce..6ececf1c4 100644 --- a/Tensile/Common.py +++ b/Tensile/Common.py @@ -26,6 +26,7 @@ from . 
import Parallel from collections import OrderedDict from copy import deepcopy +from .AsmCaps import CACHED_ASM_CAPS import math @@ -308,26 +309,6 @@ 'gfx1100':'navi31', 'gfx1101':'navi32', 'gfx1102':'navi33' } -CACHED_ASM_CAPS = { - (8, 0, 3): {'SupportedISA': True, 'HasExplicitCO': False, 'HasExplicitNC': False, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': False, 'HasLshlOr': False, 'HasSMulHi': False, 'HasWMMA': False, 'HasMFMA': False, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': False, 'v_mac_f16': True, 'v_fma_f16': False, 'v_fmac_f16': False, 'v_pk_fma_f16': False, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': False, 'v_dot2_f32_f16': False, 'v_dot2c_f32_f16': False, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': False, 'VOP3v_dot4_i32_i8': False, 'v_mac_f32': True, 'v_fma_f32': True, 'v_fmac_f32': False, 'v_fma_f64': True, 'HasAtomicAdd': False, 'HasGLCModifier': True, 'MaxVmcnt': 15, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (9, 0, 0): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': False, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': False, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': False, 'v_mac_f16': True, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': True, 'v_fma_mix_f32': False, 'v_dot2_f32_f16': False, 'v_dot2c_f32_f16': False, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': False, 'VOP3v_dot4_i32_i8': False, 'v_mac_f32': True, 'v_fma_f32': True, 'v_fmac_f32': 
False, 'v_fma_f64': True, 'HasAtomicAdd': False, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (9, 0, 6): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': False, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': False, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': False, 'v_mac_f16': True, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': False, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': False, 'VOP3v_dot4_i32_i8': True, 'v_mac_f32': True, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': False, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (9, 0, 8): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': False, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': True, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': True, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': True, 'HasMFMA_i8_940': False, 'v_mac_f16': True, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': True, 'VOP3v_dot4_i32_i8': True, 'v_mac_f32': True, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': True, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 
'SupportedSource': True}, - (9, 0, 10): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': False, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': True, 'HasMFMA_constSrc': True, 'HasMFMA_vgpr': True, 'HasMFMA_f64': True, 'HasMFMA_bf16_original': True, 'HasMFMA_bf16_1k': True, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': True, 'HasMFMA_i8_940': False, 'v_mac_f16': True, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': True, 'VOP3v_dot4_i32_i8': True, 'v_mac_f32': True, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': True, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (9, 4, 0): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': False, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': True, 'HasMFMA_constSrc': True, 'HasMFMA_vgpr': True, 'HasMFMA_f64': True, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': True, 'HasMFMA_xf32': True, 'HasMFMA_f8': True, 'HasMFMA_b8': True, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': True, 'v_mac_f16': True, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': True, 'VOP3v_dot4_i32_i8': True, 'v_mac_f32': False, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': True, 'HasGLCModifier': False, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (9, 4, 1): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': False, 'HasDirectToLdsDest': 
False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': True, 'HasMFMA_constSrc': True, 'HasMFMA_vgpr': True, 'HasMFMA_f64': True, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': True, 'HasMFMA_xf32': True, 'HasMFMA_f8': True, 'HasMFMA_b8': True, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': True, 'v_mac_f16': True, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': True, 'VOP3v_dot4_i32_i8': True, 'v_mac_f32': False, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': True, 'HasGLCModifier': False, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (9, 4, 2): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': False, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': True, 'HasMFMA_constSrc': True, 'HasMFMA_vgpr': True, 'HasMFMA_f64': True, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': True, 'HasMFMA_xf32': True, 'HasMFMA_f8': True, 'HasMFMA_b8': True, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': True, 'v_mac_f16': True, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': True, 'VOP3v_dot4_i32_i8': True, 'v_mac_f32': False, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': True, 'HasGLCModifier': False, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (10, 1, 0): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': True, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': False, 
'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': False, 'v_mac_f16': False, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': False, 'v_dot2c_f32_f16': False, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': False, 'VOP3v_dot4_i32_i8': False, 'v_mac_f32': True, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': False, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (10, 1, 1): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': True, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': False, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': False, 'v_mac_f16': False, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': True, 'VOP3v_dot4_i32_i8': True, 'v_mac_f32': True, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': False, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (10, 1, 2): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': True, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': False, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 
'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': False, 'v_mac_f16': False, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': True, 'VOP3v_dot4_i32_i8': True, 'v_mac_f32': True, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': False, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (10, 3, 0): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': True, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': False, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': False, 'v_mac_f16': False, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': True, 'VOP3v_dot4_i32_i8': True, 'v_mac_f32': False, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': False, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (10, 3, 1): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': True, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': True, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': False, 'HasMFMA': False, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': 
False, 'HasMFMA_i8_940': False, 'v_mac_f16': False, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': True, 'VOP3v_dot4_i32_i8': True, 'v_mac_f32': False, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': False, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (11, 0, 0): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': True, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': False, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': True, 'HasMFMA': False, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': False, 'v_mac_f16': False, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': False, 'VOP3v_dot4_i32_i8': False, 'v_mac_f32': False, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': True, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (11, 0, 1): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': True, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': False, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': True, 'HasMFMA': False, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': False, 'v_mac_f16': False, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': 
True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': False, 'VOP3v_dot4_i32_i8': False, 'v_mac_f32': False, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': True, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (11, 0, 2): {'SupportedISA': True, 'HasExplicitCO': True, 'HasExplicitNC': True, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': False, 'HasAddLshl': True, 'HasLshlOr': True, 'HasSMulHi': True, 'HasWMMA': True, 'HasMFMA': False, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': False, 'v_mac_f16': False, 'v_fma_f16': True, 'v_fmac_f16': False, 'v_pk_fma_f16': True, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': True, 'v_dot2_f32_f16': True, 'v_dot2c_f32_f16': True, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': False, 'VOP3v_dot4_i32_i8': False, 'v_mac_f32': False, 'v_fma_f32': True, 'v_fmac_f32': True, 'v_fma_f64': True, 'HasAtomicAdd': True, 'HasGLCModifier': True, 'MaxVmcnt': 63, 'MaxLgkmcnt': 15, 'SupportedSource': True}, - (0, 0, 0): {'SupportedISA': False, 'HasExplicitCO': False, 'HasExplicitNC': False, 'HasDirectToLdsDest': False, 'HasDirectToLdsNoDest': False, 'HasAddLshl': False, 'HasLshlOr': False, 'HasSMulHi': False, 'HasWMMA': False, 'HasMFMA': False, 'HasMFMA_constSrc': False, 'HasMFMA_vgpr': False, 'HasMFMA_f64': False, 'HasMFMA_bf16_original': False, 'HasMFMA_bf16_1k': False, 'HasMFMA_xf32': False, 'HasMFMA_f8': False, 'HasMFMA_b8': False, 'HasMFMA_i8_908': False, 'HasMFMA_i8_940': False, 'v_mac_f16': False, 'v_fma_f16': False, 'v_fmac_f16': False, 'v_pk_fma_f16': False, 'v_pk_fmac_f16': False, 'v_mad_mix_f32': False, 'v_fma_mix_f32': False, 'v_dot2_f32_f16': False, 
'v_dot2c_f32_f16': False, 'v_dot4_i32_i8': False, 'v_dot4c_i32_i8': False, 'VOP3v_dot4_i32_i8': False, 'v_mac_f32': False, 'v_fma_f32': False, 'v_fmac_f32': False, 'v_fma_f64': False, 'HasAtomicAdd': False, 'HasGLCModifier': False, 'MaxVmcnt': 0, 'MaxLgkmcnt': 15, 'SupportedSource': True}, -} - def getArchitectureName(gfxName): if gfxName in architectureMap: return architectureMap[gfxName] @@ -1403,6 +1384,19 @@ def getArchitectureName(gfxName): # 0=none, 1=add setprio, 2=add setprio and modify LDS to allow only 2 waves/simd "AggressivePerfMode": [0,1,2], + # Use the feature whereby 56 bytes of kernel arguments can be preloaded in SGPRs + # before the kernel begins executing. This is currently only supported in cases + # where that is enough to initiate the first load of the A and B tensors before + # the remaining arguments have been loaded. + # -1: Use if it's supported (by the GPU and in combination with other features) + # 0: Don't use + # 1: Use, reject solution if not supported. + "PreloadKernelArguments": [-1, 0, 1], + + # If PreloadKernelArguments is 1, specifies whether we delay initiating the load + # of the remaining arguments until after the load of A and B has been initiated. 
+ "DelayRemainingArguments": [False, True], + # Kernels should be written in assembly or source # if assembly, ISA will determine architecture # if source, Runtime will determine language @@ -1448,6 +1442,7 @@ def getArchitectureName(gfxName): {"InnerUnroll": [ 1 ] }, {"LocalDotLayout": [ 1 ] }, {"AggressivePerfMode": [ 1 ] }, + {"PreloadKernelArguments": [ 0 ] }, {"KernelLanguage": [ "Source" ] }, {"LdsPadA": [ -1 ] }, {"LdsPadB": [ -1 ] }, @@ -1597,7 +1592,7 @@ def getArchitectureName(gfxName): {"Fp16AltImplRound": [ False ] }, {"ThreadSeparateGlobalReadA": [ 0 ] }, {"ThreadSeparateGlobalReadB": [ 0 ] }, - {"MinKForGSU": [256]} + {"MinKForGSU": [256]}, ] # dictionary of defaults comprised of default option for each parameter @@ -2011,6 +2006,20 @@ def GetAsmCaps(isaVersion): # TODO- Need to query the max cap, just like vmcnt as well? derivedAsmCaps["MaxLgkmcnt"] = 15 + derivedAsmCaps["KernargPreloading"] = tryAssembler(isaVersion, """ + TestKernel: + s_endpgm + .amdhsa_kernel TestKernel + .amdhsa_next_free_vgpr 8 + .amdhsa_next_free_sgpr 4 + .amdhsa_group_segment_fixed_size 0 // lds bytes + .amdhsa_user_sgpr_kernarg_segment_ptr 1 + .amdhsa_user_sgpr_kernarg_preload_length 3 + .amdhsa_user_sgpr_kernarg_preload_offset 0 + .amdhsa_accum_offset 4 + .end_amdhsa_kernel + """) + derivedAsmCaps["SupportedSource"] = True ignoreCacheCheck = globalParameters["IgnoreAsmCapCache"] @@ -2321,6 +2330,14 @@ def assignGlobalParameters( config ): if globalParameters["PrintLevel"] >= 1: printCapTable(globalParameters) + if globalParameters["AsmCaps"] != CACHED_ASM_CAPS: + import pprint + print("ASM Caps differ from cache. 
New caps:") + print("####################") + print("CACHED_ASM_CAPS = \\\n") + pprint.pprint(globalParameters["AsmCaps"]) + print("####################") + globalParameters["SupportedISA"] = list([i for i in globalParameters["SupportedISA"] if globalParameters["AsmCaps"][i]["SupportedISA"]]) validParameters["ISA"] = [(0,0,0), *globalParameters["SupportedISA"]] diff --git a/Tensile/Components/Signature.py b/Tensile/Components/Signature.py index fef52d471..aa31ab044 100644 --- a/Tensile/Components/Signature.py +++ b/Tensile/Components/Signature.py @@ -60,7 +60,10 @@ def getDstValueType(kernel): class SignatureDefault(Signature): # Formats an argument to add to the header - def addArgument(self, name, size, offset, valueKind, valueType, AddrSpaceQual = None): + def addArgument(self, name, size, offset, valueKind, valueType = None, AddrSpaceQual = None): + self.offset += size + if valueType is None: + valueType = f"u{size*8}" kStr = "" kStr += " - .name: %s\n" % name kStr += " .size: %s\n" % size @@ -93,6 +96,21 @@ def __call__(self, writer): tWord = ".amdhsa_user_sgpr_kernarg_segment_ptr" kStr += " %s 1%s" % (tWord, writer.endLine) + supportsPreload = globalParameters["AsmCaps"][writer.version]["KernargPreloading"] + + numPreloaded = 0 + numUserSgprs = 2 + + if kernel["PreloadKernelArguments"] == 1: + numPreloaded = writer.sgprPool.numPreloadSGPRs + numUserSgprs += numPreloaded + + if supportsPreload: + kStr += f" .amdhsa_user_sgpr_kernarg_preload_offset 0{writer.endLine}" + kStr += f" .amdhsa_user_sgpr_kernarg_preload_length {numPreloaded}{writer.endLine}" + + kStr += f" .amdhsa_user_sgpr_count {numUserSgprs}{writer.endLine}" + # kern arg size kernArgReg = 0 kernArgReg += 3*writer.rpga @@ -173,12 +191,6 @@ def __call__(self, writer): kStr += writer.comment1("DirectToLdsB=%s" % kernel["DirectToLdsB"]) kStr += writer.comment1("UseSgprForGRO=%s" % kernel["_UseSgprForGRO"]) - srcValueTypeA = getSrcValueType(kernel, True) - srcValueTypeB = getSrcValueType(kernel, False) 
- dstValueType = getDstValueType(kernel) - cptValueType = kernel["ProblemType"]["ComputeDataType"].toNameAbbrev() - cptByte = kernel["ProblemType"]["ComputeDataType"].numBytes() - kStr += ".amdgpu_metadata\n" kStr += "---\n" kStr += "amdhsa.version:\n" @@ -198,122 +210,14 @@ def __call__(self, writer): kStr += " - 2%s" % writer.endLine kStr += " - 0%s" % writer.endLine kStr += " .args:%s" % writer.endLine - offset = 0 + self.offset = 0 - if globalParameters["DebugKernel"]: - kStr += self.addArgument( 'AddressDbg', '8', offset, "global_buffer","struct", "generic"); offset += 8 - - kStr += self.addArgument( 'sizeC', '8', offset, "by_value", "u64"); offset += 8 - kStr += self.addArgument( 'sizeA', '8', offset, "by_value", "u64"); offset += 8 - kStr += self.addArgument( 'sizeB', '8', offset, "by_value", "u64"); offset += 8 - - kStr += self.addArgument( 'D', '8', offset, "global_buffer", dstValueType, "generic"); offset += 8 - kStr += self.addArgument( 'C', '8', offset, "global_buffer", dstValueType, "generic"); offset += 8 - kStr += self.addArgument( 'A', '8', offset, "global_buffer", srcValueTypeA, "generic"); offset += 8 - kStr += self.addArgument( 'B', '8', offset, "global_buffer", srcValueTypeB, "generic"); offset += 8 - if kernel["StreamK"] == 2 or kernel["StreamK"] == 3: - kStr += self.addArgument( 'WS', '8', offset, "global_buffer", dstValueType, "generic"); offset += 8 - kStr += self.addArgument( 'Flags', '8', offset, "global_buffer", dstValueType, "generic"); offset += 8 - - if not kernel["ProblemType"]["StridedBatched"]: - kStr += self.addArgument("OffsetD", '8', offset, "by_value", "u64"); offset += 8 - kStr += self.addArgument("OffsetC", '8', offset, "by_value", "u64"); offset += 8 - kStr += self.addArgument("OffsetA", '8', offset, "by_value", "u64"); offset += 8 - kStr += self.addArgument("OffsetB", '8', offset, "by_value", "u64"); offset += 8 - - useSize = max(4, cptByte) - kStr += self.addArgument( "alpha", useSize, offset, "by_value", cptValueType); 
offset += useSize - if kernel["ProblemType"]["UseBeta"]: - kStr += self.addArgument( "beta", useSize, offset, "by_value", cptValueType); offset += useSize - - for i in range(0, writer.numSgprStridesD): - kStr += self.addArgument( "strideD%u"%i, '4', offset, "by_value", "u32"); offset += 4 - - for i in range(0, writer.numSgprStridesC): - kStr += self.addArgument( "strideC%u"%i, '4', offset, "by_value", "u32"); offset += 4 - - for i in range(0, writer.numSgprStridesA): - kStr += self.addArgument( "strideA%u"%i, '4', offset, "by_value", "u32"); offset += 4 - - for i in range(0, writer.numSgprStridesB): - kStr += self.addArgument( "strideB%u"%i, '4', offset, "by_value", "u32"); offset += 4 - - for i in range(0, writer.numSgprSizesFree): - kStr += self.addArgument( "SizesFree%u"%i, '4', offset, "by_value", "u32"); offset += 4 - - for i in range(0, writer.numSgprSizesSum): - kStr += self.addArgument( "SizesSum%u"%i, '4', offset, "by_value", "u32"); offset += 4 - - for magicName in writer.sumMagicParms: - kStr += self.addArgument( "MagicNumberSize%s"%magicName, '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument( "MagicShiftSize%s"%magicName, '4', offset, "by_value", "u32"); offset += 4 - - for idxChar in kernel["PackedC0IdxChars"][:-1]: - kStr += self.addArgument( "MagicNumberSize%s"%idxChar, '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument( "MagicShiftSize%s"%idxChar, '4', offset, "by_value", "u32"); offset += 4 - - for idxChar in kernel["PackedC1IdxChars"][:-1]: - kStr += self.addArgument( "MagicNumberSize%s"%idxChar, '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument( "MagicShiftSize%s"%idxChar, '4', offset, "by_value", "u32"); offset += 4 - - for idx in kernel["ProblemType"]["IndicesSummation"]: - for tc in ('A','B'): - for zp in kernel["ProblemType"]["ZeroPad%s"%tc]: - (freeDim, sumDim, padStart, padEnd) = zp - if sumDim == idx: - freeDimChar = globalParameters["IndexChars"][freeDim] - sumDimChar = 
globalParameters["IndexChars"][sumDim] - # These will eventually be read as kernel args: - kStr += self.addArgument( "PadStart%s%s%s"%(tc, freeDimChar, sumDimChar), '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument( "PadEnd%s%s%s"%(tc, freeDimChar, sumDimChar), '4', offset, "by_value", "u32"); offset += 4 - - kStr += self.addArgument( "OrigStaggerUIter", '4', offset, "by_value", "i32"); offset += 4 - - kStr += self.addArgument( "NumWorkGroups0", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument( "NumWorkGroups1", '4', offset, "by_value", "u32"); offset += 4 - - if kernel["StreamK"]: - kStr += self.addArgument("MagicNumberProblemNumGroupTiles0", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument("MagicShiftProblemNumGroupTiles0", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument("MagicNumProblemNumGroupTiles0By1", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument("MagicShiftProblemNumGroupTiles0By1", '4', offset, "by_value", "u32"); offset += 4 - - if kernel["PersistentKernel"]: - kStr += self.addArgument("MagicNumberProblemNumGroupTiles0", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument("MagicShiftProblemNumGroupTiles0", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument( "GridNumWorkGroups0", '4', offset, "by_value", "u32"); offset += 4 - if kernel["PersistentKernelAlongBatch"]: - kStr += self.addArgument( "NumWorkGroups2", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument("MagicNumProblemNumGroupTiles0By1", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument("MagicShiftProblemNumGroupTiles0By1", '4', offset,"by_value", "u32"); offset += 4 - - if kernel["StreamK"]: - kStr += self.addArgument("ItersPerTile", '4', offset,"by_value", "u32"); offset += 4 - kStr += self.addArgument("MagicNumberItersPerTile", '4', offset,"by_value", "u32"); offset += 4 - kStr += 
self.addArgument("MagicShiftItersPerTile", '4', offset,"by_value", "u32"); offset += 4 - kStr += self.addArgument("TotalIters", '4', offset,"by_value", "u32"); offset += 4 - kStr += self.addArgument("SKItersPerWG", '4', offset,"by_value", "u32"); offset += 4 - if kernel["StreamK"] == 3: # Two-tile SK - kStr += self.addArgument("skGrid", '4', offset,"by_value", "u32"); offset += 4 - kStr += self.addArgument("skTiles", '4', offset,"by_value", "u32"); offset += 4 - kStr += self.addArgument("skExtraIters", '4', offset,"by_value", "u32"); offset += 4 - # kStr += self.addArgument("dpTilesPerWG", '4', offset,"by_value", "u32"); offset += 4 - - if abs(kernel["WorkGroupMapping"]) > 1: - kStr += self.addArgument( "NumFullBlocks", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument( "WgmRemainder1", '4', offset, "by_value", "u32"); offset += 4 - kStr += self.addArgument( "MagicNumberWgmRemainder1", '4', offset, "by_value", "u32"); offset += 4 - - # for in-device stochastic rounding, iwe need to pass Seed - # TODO: if kernel["ProblemType"]["StochasticRounding"] == 1: # in-device - if kernel["ProblemType"]["StochasticRounding"]: # in-device - kStr += self.addArgument("RNDSeed", '4', offset, "by_value", "u32"); offset += 4 - - kStr += self.addArgument( "padding", '4', offset, "by_value", "u32"); offset += 4 + for arg in writer.sgprPool.kernargs: + kStr += self.addArgument(name=arg['name'], size=arg['size']*4, offset=self.offset, valueKind="by_value") kStr += " .group_segment_fixed_size: %u%s" % ( group_segment_size, writer.endLine ) #XXXXXX kStr += " .kernarg_segment_align: %u%s" % ( 8, writer.endLine ) - kStr += " .kernarg_segment_size: %u%s" % (((offset+7)//8)*8, writer.endLine) # round up to .kernarg_segment_align + kStr += " .kernarg_segment_size: %u%s" % (((self.offset+7)//8)*8, writer.endLine) # round up to .kernarg_segment_align kStr += " .max_flat_workgroup_size: %u%s" % ( kernel["SubGroup0"] * kernel["SubGroup1"] * kernel["LocalSplitU"], 
writer.endLine ) kStr += " .private_segment_fixed_size: %u%s" % ( 0, writer.endLine ) kStr += " .sgpr_count: %u%s" % ( totalSgprs, writer.endLine ) diff --git a/Tensile/Contractions.py b/Tensile/Contractions.py index 79e8f160d..b613cabe3 100644 --- a/Tensile/Contractions.py +++ b/Tensile/Contractions.py @@ -464,6 +464,7 @@ class SizeMapping: 'sourceKernel', 'globalAccumulation', 'workspaceSizePerElemC', + 'preloadKernargs' ] @classmethod @@ -475,6 +476,8 @@ def FromOriginalState(cls, d): globalAccum = 2 if d['_GlobalAccumulation'] == 'PartialsBuffer': globalAccum = 3 + + assert d["PreloadKernelArguments"] in (0, 1), d["PreloadKernelArguments"] return cls(workGroup = d['WorkGroup'], macroTile = cls.ReadOriginalMacroTile(d), threadTile = d['ThreadTile'], @@ -492,6 +495,7 @@ def FromOriginalState(cls, d): sourceKernel = d['KernelLanguage'] == 'Source', globalAccumulation = globalAccum, workspaceSizePerElemC = d['_WorkspaceSizePerElemC'], + preloadKernargs = d["PreloadKernelArguments"] ) @classmethod diff --git a/Tensile/CustomKernels/DGEMM_Aldebaran_NN_MT128x128x16_MI16x16x4x1_GRVW2_SU4_SUS128_WGM4.s b/Tensile/CustomKernels/DGEMM_Aldebaran_NN_MT128x128x16_MI16x16x4x1_GRVW2_SU4_SUS128_WGM4.s index 6199997f3..0fc84c922 100644 --- a/Tensile/CustomKernels/DGEMM_Aldebaran_NN_MT128x128x16_MI16x16x4x1_GRVW2_SU4_SUS128_WGM4.s +++ b/Tensile/CustomKernels/DGEMM_Aldebaran_NN_MT128x128x16_MI16x16x4x1_GRVW2_SU4_SUS128_WGM4.s @@ -716,9 +716,9 @@ s_mov_b32 m0, 0x9000 // LDS clamp at 36864 bytes v_mov_b32 v[vgprSerial], v0 // thread serial id /* Load Kernel Args */ -s_load_dwordx16 s[24:39], s[sgprKernArgAddress:sgprKernArgAddress+1], 0x8 // -s_load_dwordx16 s[48:63], s[sgprKernArgAddress:sgprKernArgAddress+1], 0x48 // -s_load_dwordx2 s[64:65], s[sgprKernArgAddress:sgprKernArgAddress+1], 0x88 // +s_load_dwordx16 s[24:39], s[sgprKernArgAddress:sgprKernArgAddress+1], 0x0 // +s_load_dwordx16 s[48:63], s[sgprKernArgAddress:sgprKernArgAddress+1], 0x40 // +s_load_dwordx2 s[64:65], 
s[sgprKernArgAddress:sgprKernArgAddress+1], 0x80 // s_waitcnt lgkmcnt(0) // wait for 160 bytes of kern args s_mov_b32 s44, s36 s_mov_b32 s45, s37 diff --git a/Tensile/KernelWriter.py b/Tensile/KernelWriter.py index 5e31fb5a2..7295092a2 100644 --- a/Tensile/KernelWriter.py +++ b/Tensile/KernelWriter.py @@ -3694,7 +3694,9 @@ def comment3(self, text): @abc.abstractmethod def initKernel(self, kernel, tensorParametersA, tensorParametersB ): - self.staggerU = kernel["StaggerU"] and (kernel["KernelLanguage"]=="Source" or kernel["BufferLoad"]) + self.staggerU = kernel["StaggerU"] + if self.staggerU: + assert (kernel["KernelLanguage"]=="Source" or kernel["BufferLoad"]) self.tPA = tensorParametersA self.tPB = tensorParametersB diff --git a/Tensile/KernelWriterAssembly.py b/Tensile/KernelWriterAssembly.py index c48d33f3a..235f6b316 100644 --- a/Tensile/KernelWriterAssembly.py +++ b/Tensile/KernelWriterAssembly.py @@ -219,6 +219,21 @@ def laneSGPRCount(self) -> int: else: return 1 + @property + def rpga(self) -> int: + """ (2) registers per global address (64-bit) """ + return 2 + + @property + def rpla(self): + """ (1) registers per local address (32-bit) """ + return 1 + + @property + def rpgo(self): + """ (1) registers per global 32-bit offset (some intructions only support 32-bit offset) """ + return 1 + def getCompileArgs(self, sourceFileName, objectFileName, *moreArgs, isa=None, wavefrontSize=None): if isa is None: isa = self.version @@ -534,10 +549,26 @@ def getTmpSgpr(self, num, align=None, tag=None): assert(t.idx()+num <= self.maxSgprs) return t - def defineSgpr(self, name, numSgprs, align=1): + def definePreloadedSgprPool(self, numSgprs): + self.sgprPool.add(self.sgprPool.size(), numSgprs, newStatus = RegisterPool.Status.AvailableForPreload) + + def defineSgpr(self, name, numSgprs, align=1, kernarg=None, preload=False): if numSgprs == 0: return + if kernarg is None: + kernarg = preload + + if self.kernel["PreloadKernelArguments"] != 1: + preload = False + + sgprIdx = 
self.sgprPool.checkOutAligned(numSgprs, align, tag=name, preventOverflow=False, kernarg=kernarg, preload=preload) - sgprIdx = self.sgprPool.checkOutAligned(numSgprs, align, tag=name, preventOverflow=0) + if preload: + self.preloadedKernargs[0] = min(sgprIdx, self.preloadedKernargs[0]) + self.preloadedKernargs[1] = max(sgprIdx+numSgprs, self.preloadedKernargs[1]) + elif kernarg: + self.loadedKernargs[0] = min(sgprIdx, self.loadedKernargs[0]) + self.loadedKernargs[1] = max(sgprIdx+numSgprs, self.loadedKernargs[1]) + #self.sgprIdx = roundUpToNearestMultiple(self.sgprIdx,align) #print (name, "->", self.sgprIdx, "+", numSgprs) self.sgprs[name] = sgprIdx @@ -717,6 +748,9 @@ def initKernel(self, kernel, tPA, tPB ): tPB["localReadOffset"] = 0 self.sgprs=collections.OrderedDict() + self.preloadedSgprs = collections.OrderedDict() + self.loadedKernargs = [1000000, -1] + self.preloadedKernargs = [1000000, -1] self.LdsOOB = 0xF00000 @@ -1064,12 +1098,6 @@ def initKernel(self, kernel, tPA, tPB ): assert self.bpeAB == tPA["bpe"] assert self.bpeAB == tPB["bpe"] - # registers per global address - self.rpga = 2 # 64-bit - # registers per local address - self.rpla = 1 # 32-bit - # registers per global 32-bit offset (some intructions only support 32-bit offset) - self.rpgo = 1 # 32-bit #################################### # choose memory instructions @@ -1764,6 +1792,8 @@ def initKernel(self, kernel, tPA, tPB ): ######################################## self.defineSgpr("KernArgAddress", self.rpga) assert(self.sgprs["KernArgAddress"] == 0) # kernarg is passed to kernel as SGPR0 + if self.kernel["PreloadKernelArguments"] == 1: + self.definePreloadedSgprPool(14) #if kernel["WorkGroupMapping"]>=0 : # self.defineSgpr("WorkGroup0", 1) @@ -1853,49 +1883,37 @@ def initKernel(self, kernel, tPA, tPB ): ################################### # Get kernel argument start here - self.defineSgpr("Tensor2dSizeA", 2,4) - # fill empty Sgpr slot caused by Sgpr alignment, - # because we need following 
defineSgpr use continuous sgpr - SgprSlot = [] - currentSize = self.sgprPool.size() - while (1): - tempSgpr = self.sgprPool.checkOut(1,"fill empty slot temporarily",preventOverflow=0) - if tempSgpr >= currentSize: - self.sgprPool.checkIn(tempSgpr) - break - SgprSlot.append(tempSgpr) - self.defineSgpr("Tensor2dSizeB", 2, 2) + self.defineSgpr("Tensor2dSizeA", 2, (2 if kernel["PreloadKernelArguments"] == 1 else 4), preload=True) + self.defineSgpr("Tensor2dSizeB", 2, 2, preload=True) self.argAddressOffset = 6 * 4 # 8 bytes C, A, B - self.defineSgpr("AddressD", numSgprAddressD) - self.defineSgpr("AddressC", numSgprAddressC) - self.defineSgpr("AddressA", numSgprAddressA) - self.defineSgpr("AddressB", numSgprAddressB) - self.argOffsetOffset = self.argAddressOffset + (numSgprAddressD + numSgprAddressC + numSgprAddressA + numSgprAddressB) * 4 + self.defineSgpr("AddressD", numSgprAddressD, kernarg=True) + self.defineSgpr("AddressC", numSgprAddressC, kernarg=True) + self.defineSgpr("AddressA", numSgprAddressA, preload=True) + self.defineSgpr("AddressB", numSgprAddressB, preload=True) if kernel["StreamK"] == 2 or kernel["StreamK"] == 3: - self.defineSgpr("AddressWS", numSgprAddressWS) - self.defineSgpr("AddressFlags", numSgprAddressFlags) - self.argOffsetOffset += (numSgprAddressWS + numSgprAddressFlags) * 4 + self.defineSgpr("AddressWS", numSgprAddressWS, kernarg=True) + self.defineSgpr("AddressFlags", numSgprAddressFlags, kernarg=True) if not kernel["ProblemType"]["StridedBatched"]: self.numSgprOffsetD = 2 self.numSgprOffsetC = 2 self.numSgprOffsetA = 2 self.numSgprOffsetB = 2 - self.defineSgpr("OffsetD", self.numSgprOffsetD) - self.defineSgpr("OffsetC", self.numSgprOffsetC) - self.defineSgpr("OffsetA", self.numSgprOffsetA) - self.defineSgpr("OffsetB", self.numSgprOffsetB) + self.defineSgpr("OffsetD", self.numSgprOffsetD, kernarg=True) + self.defineSgpr("OffsetC", self.numSgprOffsetC, kernarg=True) + self.defineSgpr("OffsetA", self.numSgprOffsetA, kernarg=True) + 
self.defineSgpr("OffsetB", self.numSgprOffsetB, kernarg=True) - self.defineSgpr("Alpha", numSgprAlpha, numSgprAlpha) + self.defineSgpr("Alpha", numSgprAlpha, numSgprAlpha, preload=True) if kernel["ProblemType"]["UseBeta"]: - self.defineSgpr("Beta", numSgprBeta, numSgprBeta) - self.defineSgpr("StridesD", self.numSgprStridesD) - self.defineSgpr("StridesC", self.numSgprStridesC) - self.defineSgpr("StridesA", self.numSgprStridesA) - self.defineSgpr("StridesB", self.numSgprStridesB) - self.defineSgpr("SizesFree", self.numSgprSizesFree) - self.defineSgpr("SizesSum", self.numSgprSizesSum) + self.defineSgpr("Beta", numSgprBeta, numSgprBeta, kernarg=True) + self.defineSgpr("StridesD", self.numSgprStridesD, kernarg=True) + self.defineSgpr("StridesC", self.numSgprStridesC, kernarg=True) + self.defineSgpr("StridesA", self.numSgprStridesA, preload=True) + self.defineSgpr("StridesB", self.numSgprStridesB, preload=True) + self.defineSgpr("SizesFree", self.numSgprSizesFree, kernarg=True) + self.defineSgpr("SizesSum", self.numSgprSizesSum, preload=True) self.sumMagicParms = [] if kernel["PackSummationDims"]: @@ -1904,17 +1922,17 @@ def initKernel(self, kernel, tPA, tPB ): if kernel["PackSummationDims"] and kernel["GlobalSplitU"] > 1 and self.sumMagicParms: self.sumMagicParms.append("%s_GsuRemainder"%self.unrollChar) for magicName in self.sumMagicParms: - self.defineSgpr("MagicNumberSize%s"%magicName, 1) - self.defineSgpr("MagicShiftSize%s"%magicName, 1) + self.defineSgpr("MagicNumberSize%s"%magicName, 1, kernarg=True) + self.defineSgpr("MagicShiftSize%s"%magicName, 1, kernarg=True) # for packed batches without stride restrictions need to do something different here assert sorted(kernel["PackedC0IdxChars"]+kernel["PackedC1IdxChars"]) == \ sorted(set(kernel["PackedC0IdxChars"]+kernel["PackedC1IdxChars"])) for idxChar in kernel["PackedC0IdxChars"][:-1]: - self.defineSgpr("MagicNumberSize%s"%idxChar, 1) - self.defineSgpr("MagicShiftSize%s"%idxChar, 1) + 
self.defineSgpr("MagicNumberSize%s"%idxChar, 1, kernarg=True) + self.defineSgpr("MagicShiftSize%s"%idxChar, 1, kernarg=True) for idxChar in kernel["PackedC1IdxChars"][:-1]: - self.defineSgpr("MagicNumberSize%s"%idxChar, 1) - self.defineSgpr("MagicShiftSize%s"%idxChar, 1) + self.defineSgpr("MagicNumberSize%s"%idxChar, 1, kernarg=True) + self.defineSgpr("MagicShiftSize%s"%idxChar, 1, kernarg=True) for idx in kernel["ProblemType"]["IndicesSummation"]: for tc in ('A','B'): for zp in kernel["ProblemType"]["ZeroPad%s"%tc]: @@ -1923,41 +1941,42 @@ def initKernel(self, kernel, tPA, tPB ): freeDimChar = globalParameters["IndexChars"][freeDim] sumDimChar = globalParameters["IndexChars"][sumDim] # These will eventually be read as kernel args: - self.defineSgpr("PadStart%s%s%s"%(tc, freeDimChar, sumDimChar),1) - self.defineSgpr("PadEnd%s%s%s"%(tc, freeDimChar, sumDimChar),1) - self.defineSgpr("OrigStaggerUIter", 1) # Original stagger register. Only needed for Persistent - self.defineSgpr("NumWorkGroups0", 1) - self.defineSgpr("NumWorkGroups1", 1) + self.defineSgpr("PadStart%s%s%s"%(tc, freeDimChar, sumDimChar),1, kernarg=True) + self.defineSgpr("PadEnd%s%s%s"%(tc, freeDimChar, sumDimChar),1, kernarg=True) + if self.staggerU: + self.defineSgpr("OrigStaggerUIter", 1, kernarg=True) # Original stagger register. 
Only needed for Persistent + self.defineSgpr("NumWorkGroups0", 1, kernarg=True) + self.defineSgpr("NumWorkGroups1", 1, kernarg=True) pkArgumentToLoad = 0 if kernel["PersistentKernel"]: - self.defineSgpr("MagicNumberProblemNumGroupTiles0", 1) # Magic number to use for division - self.defineSgpr("MagicShiftProblemNumGroupTiles0", 1) # Magic shift/abit to use for division alg 2 - self.defineSgpr("GridNumWorkGroups0", 1) # Magic number to use for division, persistent kernel - flattened wg0 (=all WGs) + self.defineSgpr("MagicNumberProblemNumGroupTiles0", 1, kernarg=True) # Magic number to use for division + self.defineSgpr("MagicShiftProblemNumGroupTiles0", 1, kernarg=True) # Magic shift/abit to use for division alg 2 + self.defineSgpr("GridNumWorkGroups0", 1, kernarg=True) # Magic number to use for division, persistent kernel - flattened wg0 (=all WGs) pkArgumentToLoad += 3 if kernel["PersistentKernelAlongBatch"]: - self.defineSgpr("NumWorkGroups2", 1) # for persistent kernel along batch - self.defineSgpr("MagicNumProblemNumGroupTiles0By1", 1) # for PKAB, use for Magic Div Alg 2 by (nwg0*nwg1) - self.defineSgpr("MagicShiftProblemNumGroupTiles0By1", 1) # for PKAB, use for Magic Div Alg 2 by (nwg0*nwg1) + self.defineSgpr("NumWorkGroups2", 1, kernarg=True) # for persistent kernel along batch + self.defineSgpr("MagicNumProblemNumGroupTiles0By1", 1, kernarg=True) # for PKAB, use for Magic Div Alg 2 by (nwg0*nwg1) + self.defineSgpr("MagicShiftProblemNumGroupTiles0By1", 1, kernarg=True) # for PKAB, use for Magic Div Alg 2 by (nwg0*nwg1) pkArgumentToLoad += 3 skArgumentToLoad = 0 if kernel["StreamK"]: # StreamK args - self.defineSgpr("MagicNumberProblemNumGroupTiles0", 1) # Magic number to use for division - self.defineSgpr("MagicShiftProblemNumGroupTiles0", 1) # Magic shift/abit to use for division alg 2 - self.defineSgpr("ItersPerTile", 1) - self.defineSgpr("MagicNumberItersPerTile", 1) - self.defineSgpr("MagicShiftItersPerTile", 1) - 
self.defineSgpr("MagicNumProblemNumGroupTiles0By1", 1) # for PKAB, use for Magic Div Alg 2 by (nwg0*nwg1) - self.defineSgpr("MagicShiftProblemNumGroupTiles0By1", 1) # for PKAB, use for Magic Div Alg 2 by (nwg0*nwg1) - self.defineSgpr("TotalIters", 1) - self.defineSgpr("SKItersPerWG", 1) + self.defineSgpr("MagicNumberProblemNumGroupTiles0", 1, kernarg=True) # Magic number to use for division + self.defineSgpr("MagicShiftProblemNumGroupTiles0", 1, kernarg=True) # Magic shift/abit to use for division alg 2 + self.defineSgpr("ItersPerTile", 1, kernarg=True) + self.defineSgpr("MagicNumberItersPerTile", 1, kernarg=True) + self.defineSgpr("MagicShiftItersPerTile", 1, kernarg=True) + self.defineSgpr("MagicNumProblemNumGroupTiles0By1", 1, kernarg=True) # for PKAB, use for Magic Div Alg 2 by (nwg0*nwg1) + self.defineSgpr("MagicShiftProblemNumGroupTiles0By1", 1, kernarg=True) # for PKAB, use for Magic Div Alg 2 by (nwg0*nwg1) + self.defineSgpr("TotalIters", 1, kernarg=True) + self.defineSgpr("SKItersPerWG", 1, kernarg=True) skArgumentToLoad += 9 if kernel["StreamK"] == 3: # Two-tile SK - self.defineSgpr("skGrid", 1) - self.defineSgpr("skTiles", 1) - self.defineSgpr("skExtraIters", 1) - # self.defineSgpr("dpTilesPerWG", 1) + self.defineSgpr("skGrid", 1, kernarg=True) + self.defineSgpr("skTiles", 1, kernarg=True) + self.defineSgpr("skExtraIters", 1, kernarg=True) + # self.defineSgpr("dpTilesPerWG", 1, kernarg=True) skArgumentToLoad += 3 @@ -1971,14 +1990,16 @@ def initKernel(self, kernel, tPA, tPB ): self.numSgprWGM = 0 if abs(kernel["WorkGroupMapping"]) > 1: self.numSgprWGM = 3 - self.defineSgpr("NumFullBlocks", 1) # Magic number to use for div by (NumWorkGroups1 % WGM) - self.defineSgpr("WgmRemainder1", 1) # Magic number to use for div by (NumWorkGroups1 % WGM) - self.defineSgpr("MagicNumberWgmRemainder1", 1) # Magic number to use for div by (NumWorkGroups1 % WGM) + self.defineSgpr("NumFullBlocks", 1, kernarg=True) # Magic number to use for div by (NumWorkGroups1 % WGM) + 
self.defineSgpr("WgmRemainder1", 1, kernarg=True) # Magic number to use for div by (NumWorkGroups1 % WGM) + self.defineSgpr("MagicNumberWgmRemainder1", 1, kernarg=True) # Magic number to use for div by (NumWorkGroups1 % WGM) # SR only for F8 type if kernel["ProblemType"]["DataType"].is8bitFloat(): if kernel["ProblemType"]["StochasticRounding"]: # in-device, only RNDSeed - self.defineSgpr("RNDSeed", 1) # seed for random number generation + self.defineSgpr("RNDSeed", 1, kernarg=True) # seed for random number generation + + #---- if self.isInitCodeOptLW: # init code optimization: define PerpOverhangVccA, B just after kernel args (need this before undef OFFSET) @@ -1993,37 +2014,17 @@ def initKernel(self, kernel, tPA, tPB ): if kernel["LocalWriteUseSgprB"]: self.defineSgpr("LocalWriteAddrB", 1) - self.numSgprToLoad = 2 + 2 + numSgprAddressD + numSgprAddressC + numSgprAddressA + numSgprAddressB + \ - ((numSgprAddressWS + numSgprAddressFlags) if kernel["StreamK"] >= 2 else 0) + \ - numSgprAlpha + \ - (numSgprBeta if kernel["ProblemType"]["UseBeta"] else 0) + self.numSgprStridesD + self.numSgprStridesC + self.numSgprStridesA + \ - self.numSgprStridesB + self.numSgprSizesFree + self.numSgprSizesSum + \ - len(self.sumMagicParms)*2 + len(kernel["PackedC0IdxChars"][:-1])*2 + \ - len(kernel["PackedC1IdxChars"][:-1])*2 + len(kernel["ProblemType"]["ZeroPadA"])*2 + len(kernel["ProblemType"]["ZeroPadB"])*2 + \ - 1 + \ - 2 + \ - pkArgumentToLoad + \ - skArgumentToLoad + \ - self.numSgprWGM + \ - self.numSgprOffsetD + self.numSgprOffsetC + self.numSgprOffsetA + self.numSgprOffsetB - - # SR only for F8 type - if kernel["ProblemType"]["DataType"].is8bitFloat(): - if kernel["ProblemType"]["StochasticRounding"]: # in-device, only RNDSeed - self.numSgprToLoad += 1 - - self.argOffsetOffset = (self.numSgprToLoad + 2 - (self.numSgprOffsetD + self.numSgprOffsetC + self.numSgprOffsetA + self.numSgprOffsetB)) * 4 + self.numSgprToLoad = self.sgprPool.numKernargSGPRs + if not 
kernel["ProblemType"]["StridedBatched"]: + offsetD = self.sgprs["OffsetD"] + self.argOffsetOffset = (offsetD - self.sgprPool.kernargStart) * 4 + assert self.sgprs["OffsetC"] == offsetD + 2 + assert self.sgprs["OffsetA"] == offsetD + 4 + assert self.sgprs["OffsetB"] == offsetD + 6 # Get kernel argument end here ################################### - # put unused Sgpr back to SgprPool - while SgprSlot: - tempSgpr = SgprSlot.pop(0) - self.sgprPool.checkIn(tempSgpr) - if not self.staggerU: - self.undefineSgpr("OrigStaggerUIter") # Original stagger register. Only needed for Persistent - ######################################## # Register Pools ######################################## @@ -2164,8 +2165,11 @@ def initKernel(self, kernel, tPA, tPB ): ############################################################################## # format macro - def macroRegister(self, name, value): - return ".set %s, %s%s" % (name, value, self.endLine) + def macroRegister(self, name, value, comment=""): + if comment != "": + assert '\n' not in comment, comment + comment = " // " + comment + return f".set {name}, {value}{comment}{self.endLine}" ############################################################################## @@ -2771,7 +2775,9 @@ def functionSignature(self, kernel ): # Emit declarations for all sgprs allocated with defineSgpr # in the order they were declared for skey in self.sgprs: - kStr += self.macroRegister("sgpr"+skey, self.sgprs[skey]) + regNum = self.sgprs[skey] + count = self.sgprPool.checkOutSizeCache[skey] if skey in self.sgprPool.checkOutSizeCache else "unk" + kStr += self.macroRegister("sgpr"+skey, regNum, f"({count})") kStr += self.comment1("max SGPR=%u"%self.sgprPool.size()) kStr += "\n" @@ -3299,10 +3305,77 @@ def loadBatchedAddress(self, kernel, Batch, tmpSgpr): return kStr + ######################################## + # load kernel args + def loadKernelArguments(self): + kStr = "" + + kStr += self.comment("Load Kernel Args") + self.kernArgOffset = 0 + if 
self.kernel["PreloadKernelArguments"] == 1: + self.kernArgOffset = self.sgprPool.numPreloadSGPRs * 4 + + if globalParameters["DebugKernel"]: + kStr += self.getKernArg("AddressDbg") + kStr += self.getKernArg("AddressDbg+1") + + load = self.numSgprToLoad + sgprStart = self.sgprPool.kernargStart + while load > 0: + if load >= 16: + load -= 16 + kStr += inst("_s_load_b512", sgpr(sgprStart,16), sgpr("KernArgAddress",2), hex(self.kernArgOffset), "") + sgprStart += 16 + self.kernArgOffset += 16 * 4 + continue + if load >= 8: + load -= 8 + kStr += inst("_s_load_b256", sgpr(sgprStart,8), sgpr("KernArgAddress",2), hex(self.kernArgOffset), "") + sgprStart += 8 + self.kernArgOffset += 8 * 4 + continue + if load >= 4: + load -= 4 + kStr += inst("_s_load_b128", sgpr(sgprStart,4), sgpr("KernArgAddress",2), hex(self.kernArgOffset), "") + sgprStart += 4 + self.kernArgOffset += 4 * 4 + continue + if load >= 2: + load -= 2 + kStr += inst("_s_load_b64", sgpr(sgprStart,2), sgpr("KernArgAddress",2), hex(self.kernArgOffset), "") + sgprStart += 2 + self.kernArgOffset += 2 * 4 + continue + if load >= 1: + load -= 1 + kStr += inst("_s_load_b32", sgpr(sgprStart), sgpr("KernArgAddress",2), hex(self.kernArgOffset), "") + sgprStart += 1 + self.kernArgOffset += 1 * 4 + continue + # currently align sgpr to kernel argument memory, and use s_load_bxxx to load argument as large as possible in one instruction + # however, in order to match sgpr to kernel argument memory, some unnecessarily sgpr will also be defined, and caused wasting of sgpr. 
+ # TODO: more efficient way is to organize both sgpr and kernel argument memory in API + + # KernArgAddress needed for general batch after loading arguments + if self.kernel["ProblemType"]["StridedBatched"] or not self.kernel["ProblemType"]["Batched"]: + self.undefineSgpr("KernArgAddress") + + return kStr + ############################################################################## def allocateResources(self, kernel, lraCode=None): kStr = "" + if kernel["PreloadKernelArguments"] == 1: + kStr += self.comment("256 bytes of s_nop") + for i in range(64): + kStr += inst("s_nop 0", "preload") + + kStr += self.comment("256 bytes of s_nop") + kStr += "\n" + kStr += f"{self.kernelName}_preloaded: // Kernel start when preloading\n" + + if kernel["StorePriorityOpt"]: kStr += inst("s_setprio 3", "optimization store") @@ -3333,57 +3406,8 @@ def allocateResources(self, kernel, lraCode=None): if self.kernel["WavefrontSize"] == 32: kStr += inst("s_mov_b32", "vcc_hi", "0", "Ensure hi bits are zero") - ######################################## - # load kernel args - kStr += self.comment("Load Kernel Args") - self.kernArgOffset = 0 - if globalParameters["DebugKernel"]: - kStr += self.getKernArg("AddressDbg") - kStr += self.getKernArg("AddressDbg+1") - - kStr += self.getKernArg("Tensor2dSizeC+0",0) - kStr += self.getKernArg("Tensor2dSizeC+1",0) - - load = self.numSgprToLoad - sgprStart = self.sgprs["Tensor2dSizeA"] - while load > 0: - if load >= 16: - load -= 16 - kStr += inst("_s_load_b512", sgpr(sgprStart,16), sgpr("KernArgAddress",2), hex(self.kernArgOffset), "") - sgprStart += 16 - self.kernArgOffset += 16 * 4 - continue - if load >= 8: - load -= 8 - kStr += inst("_s_load_b256", sgpr(sgprStart,8), sgpr("KernArgAddress",2), hex(self.kernArgOffset), "") - sgprStart += 8 - self.kernArgOffset += 8 * 4 - continue - if load >= 4: - load -= 4 - kStr += inst("_s_load_b128", sgpr(sgprStart,4), sgpr("KernArgAddress",2), hex(self.kernArgOffset), "") - sgprStart += 4 - self.kernArgOffset 
+= 4 * 4 - continue - if load >= 2: - load -= 2 - kStr += inst("_s_load_b64", sgpr(sgprStart,2), sgpr("KernArgAddress",2), hex(self.kernArgOffset), "") - sgprStart += 2 - self.kernArgOffset += 2 * 4 - continue - if load >= 1: - load -= 1 - kStr += inst("_s_load_b32", sgpr(sgprStart), sgpr("KernArgAddress",2), hex(self.kernArgOffset), "") - sgprStart += 1 - self.kernArgOffset += 1 * 4 - continue - # currently align sgpr to kernel argument memory, and use s_load_bxxx to load argument as large as possible in one instruction - # however, in order to match sgpr to kernel argument memory, some unnecessarily sgpr will also be defined, and caused wasting of sgpr. - # TODO: more efficient way is to organize both sgpr and kernel argument memory in API - - # KernArgAddress needed for general batch after loading arguments - if kernel["ProblemType"]["StridedBatched"] or not kernel["ProblemType"]["Batched"]: - self.undefineSgpr("KernArgAddress") + if not self.kernel["DelayRemainingArguments"]: + kStr += self.loadKernelArguments() if kernel.enabledSetPrioSplitLDS: kStr += inst("s_setprio", "1", "prioritize init code so as to issue load sooner") @@ -3393,7 +3417,9 @@ def allocateResources(self, kernel, lraCode=None): if lraCode != None : kStr += lraCode - kStr += inst("s_waitcnt", "lgkmcnt(0)", "wait for %u bytes of kern args" % self.kernArgOffset ) + if kernel["PreloadKernelArguments"] != 1: + kernArgBytes = self.sgprPool.numKernargSGPRs * 4 + kStr += inst("s_waitcnt", "lgkmcnt(0)", "wait for %u bytes of kern args" % kernArgBytes ) if not kernel["ProblemType"]["StridedBatched"]: tmpSgpr = self.getTmpSgpr(self.laneSGPRCount).idx() @@ -3422,7 +3448,7 @@ def allocateResources(self, kernel, lraCode=None): self.releaseSgprAdressAB = True self.sgprAddressStrAB = "Srd" # C,D check - if kernel["BufferStore"] and kernel["PrefetchGlobalRead"]: + if kernel["BufferStore"] and kernel["PrefetchGlobalRead"] and kernel["PreloadKernelArguments"] != 1: self.releaseSgprAdressCD = True 
self.sgprAddressStrCD = "Srd" @@ -5876,7 +5902,13 @@ def lraDeclareAddresses(self, kernel, tP): # used. ############################################################################## def openShadowInit(self, kernel): - return self.getNamedLabelDef("ShadowInitStart") + kStr = self.getNamedLabelDef("ShadowInitStart") + if self.kernel["PreloadKernelArguments"] == 1: + if self.kernel["DelayRemainingArguments"]: + kStr += self.loadKernelArguments() + kernArgBytes = self.sgprPool.numKernargSGPRs * 4 + kStr += inst("s_waitcnt", "lgkmcnt(0)", "wait for %u bytes of kern args" % kernArgBytes ) + return kStr ############################################################################## # closeShadowInit diff --git a/Tensile/Parallel.py b/Tensile/Parallel.py index d7370ed8f..1ffd4873e 100644 --- a/Tensile/Parallel.py +++ b/Tensile/Parallel.py @@ -71,7 +71,7 @@ def ParallelMap(function, objects, message="", enable=True, multiArg=True): if threadCount <= 1 and globalParameters["ShowProgressBar"]: # Provide a progress bar for single-threaded operation. - return list(map(function, Utils.tqdm(objects, message))) + return list(map(lambda objs: function(*objs), Utils.tqdm(objects, message))) countMessage = "" try: diff --git a/Tensile/SolutionStructs.py b/Tensile/SolutionStructs.py index 9a6392646..887533885 100644 --- a/Tensile/SolutionStructs.py +++ b/Tensile/SolutionStructs.py @@ -2990,6 +2990,58 @@ def assignDerivedParameters(state): if state["LocalSplitU"] > 1: reject(state, "Atomic Stream-K not working with LocalSplitU") + if state["KernelLanguage"] == "Assembly" and not state["BufferLoad"]: + # StaggerU only works with source kernels, or with BufferLoad. + # Since StaggerU defaults to 32, override it to 0 if not supported. + state["StaggerU"] = 0 + + def supportsPreloadKernelArguments(): + if not globalParameters["AsmCaps"][isa]["KernargPreloading"]: + return False, f"{isa} doesn't support preloading." 
+ + if not state["ProblemType"]["StridedBatched"]: + return False, "Preloading only supported in StridedBatched mode." + + dt = state["ProblemType"]["DataType"] + if not (dt.isSingle() or dt.isHalf() or dt.isBFloat16()): + return False, f"Preloading not supported for data type {dt}." + + if not state["ProblemType"]["UseBeta"]: + return False, "Preloading only supported with UseBeta." + + if state["ProblemType"]["UseInitialStridesAB"]: + return False, "Preloading not supported with initial strides AB." + + if abs(state["WorkGroupMapping"]) > 1: + return False, "Preloading not supported with WorkGroupMapping." + + if not state["PrefetchGlobalRead"]: + return False, "Preloading must use PrefetchGlobalRead." + + if state["EdgeType"] == "ShiftPtr": + return False, "Preloading not compatible with ShiftPtr." + + if state["StaggerU"] != 0: + return False, "Preloading not compatible with StaggerU." + + return True, "" + + pkaSupported, pkaMsg = supportsPreloadKernelArguments() + if state["PreloadKernelArguments"] == -1: + if pkaSupported: + state["PreloadKernelArguments"] = 1 + else: + state["PreloadKernelArguments"] = 0 + elif state["PreloadKernelArguments"] == 1: + if not pkaSupported: + reject(state, pkaMsg) + + if "DelayRemainingArguments" in state: + if state["DelayRemainingArguments"] and state["PreloadKernelArguments"] != 1: + reject(state, "Delayed kernel arguments only supported when preloading.") + else: + state["DelayRemainingArguments"] = False + if state["VectorStore"] == -1: state["_VectorStore"] = 1 # default, may be changed if needed to generate a valid kernel diff --git a/Tensile/Source/lib/include/Tensile/ContractionSolution.hpp b/Tensile/Source/lib/include/Tensile/ContractionSolution.hpp index 7cda789ac..b205f989c 100644 --- a/Tensile/Source/lib/include/Tensile/ContractionSolution.hpp +++ b/Tensile/Source/lib/include/Tensile/ContractionSolution.hpp @@ -85,6 +85,7 @@ namespace Tensile bool persistentKernelAlongBatch = false; bool sourceKernel = false; + 
int preloadKernargs = 0; int globalAccumulation = 0; size_t workspaceSizePerElemC = 0; }; diff --git a/Tensile/Source/lib/include/Tensile/Serialization/ContractionSolution.hpp b/Tensile/Source/lib/include/Tensile/Serialization/ContractionSolution.hpp index def53f5a0..731aefe7c 100644 --- a/Tensile/Source/lib/include/Tensile/Serialization/ContractionSolution.hpp +++ b/Tensile/Source/lib/include/Tensile/Serialization/ContractionSolution.hpp @@ -93,6 +93,7 @@ namespace Tensile iot::mapRequired(io, "persistentKernel", s.persistentKernel); iot::mapRequired(io, "persistentKernelAlongBatch", s.persistentKernelAlongBatch); iot::mapRequired(io, "sourceKernel", s.sourceKernel); + iot::mapOptional(io, "preloadKernargs", s.preloadKernargs); iot::mapRequired(io, "globalAccumulation", s.globalAccumulation); iot::mapRequired(io, "workspaceSizePerElemC", s.workspaceSizePerElemC); diff --git a/Tensile/Source/lib/source/ContractionSolution.cpp b/Tensile/Source/lib/source/ContractionSolution.cpp index 81372fee3..e70fc4ddf 100644 --- a/Tensile/Source/lib/source/ContractionSolution.cpp +++ b/Tensile/Source/lib/source/ContractionSolution.cpp @@ -367,6 +367,12 @@ namespace Tensile rv.sharedMemBytes = 0; + size_t startStrideCD = problemType.useInitialStridesCD ? 0 : 1; + size_t startStrideAB = problemType.useInitialStridesAB ? 0 : 1; + + auto problemSizes = problem.problemSizes(); + TENSILE_ASSERT_EXC(problemSizes.size() > 0); + if(!isSourceKernel()) { uint64_t tensor2dSizeC = c.totalAllocatedElements(); @@ -377,9 +383,40 @@ namespace Tensile ? 
b.totalAllocatedElements() : problem.allocatedElementsNonBatchB(); - rv.args.append("tensor2dSizeC", tensor2dSizeC); - rv.args.append("tensor2dSizeA", tensor2dSizeA); - rv.args.append("tensor2dSizeB", tensor2dSizeB); + if(sizeMapping.preloadKernargs) + { + TENSILE_ASSERT_EXC(problemType.stridedBatched); + TENSILE_ASSERT_EXC(problemType.useBeta); + TENSILE_ASSERT_EXC(startStrideAB == 1); + + rv.args.append("tensor2dSizeA", tensor2dSizeA); + rv.args.append("tensor2dSizeB", tensor2dSizeB); + + auto aptr = inputs.a + a.offset(); + auto bptr = inputs.b + b.offset(); + rv.args.append("a", aptr); + rv.args.append("b", bptr); + + rv.args.append("alpha", inputs.alpha); + if(std::is_same::value && !isSourceKernel()) + rv.args.append("alpha_2", inputs.alpha); + + for(size_t i = startStrideAB; i < a.dimensions(); i++) + rv.args.append(concatenate_if("strideA", i), a.strides()[i]); + + for(size_t i = startStrideAB; i < b.dimensions(); i++) + rv.args.append(concatenate_if("strideB", i), b.strides()[i]); + + rv.args.append("sizeSum", problemSizes.back()); + } + + // rv.args.append("tensor2dSizeC", tensor2dSizeC); + + if(!sizeMapping.preloadKernargs) + { + rv.args.append("tensor2dSizeA", tensor2dSizeA); + rv.args.append("tensor2dSizeB", tensor2dSizeB); + } } if(sizeMapping.globalAccumulation && sizeMapping.streamK < 2) @@ -389,10 +426,8 @@ namespace Tensile } else if(problemType.stridedBatched) { - auto dptr = inputs.d; - dptr += d.offset(); - auto cptr = inputs.c; - cptr += c.offset(); + auto dptr = inputs.d + d.offset(); + auto cptr = inputs.c + c.offset(); rv.args.append("d", dptr); rv.args.append("c", cptr); } @@ -404,12 +439,13 @@ namespace Tensile if(problemType.stridedBatched) { - auto aptr = inputs.a; - aptr += a.offset(); - auto bptr = inputs.b; - bptr += b.offset(); - rv.args.append("a", aptr); - rv.args.append("b", bptr); + if(!sizeMapping.preloadKernargs) + { + auto aptr = inputs.a + a.offset(); + auto bptr = inputs.b + b.offset(); + rv.args.append("a", aptr); + 
rv.args.append("b", bptr); + } } else { @@ -435,9 +471,12 @@ namespace Tensile rv.args.append("offsetB", b.offset()); } - rv.args.append("alpha", inputs.alpha); - if(std::is_same::value && !isSourceKernel()) - rv.args.append("alpha_2", inputs.alpha); + if(!sizeMapping.preloadKernargs) + { + rv.args.append("alpha", inputs.alpha); + if(std::is_same::value && !isSourceKernel()) + rv.args.append("alpha_2", inputs.alpha); + } if(problemType.useBeta) { @@ -446,9 +485,6 @@ namespace Tensile rv.args.append("beta_2", inputs.beta); } - size_t startStrideCD = problemType.useInitialStridesCD ? 0 : 1; - size_t startStrideAB = problemType.useInitialStridesAB ? 0 : 1; - if(sizeMapping.globalAccumulation && sizeMapping.streamK < 2) { size_t wsStride = startStrideCD ? d.sizes()[0] : 1; @@ -474,18 +510,22 @@ namespace Tensile rv.args.append(concatenate_if("strideC", i), c.strides()[i]); } - for(size_t i = startStrideAB; i < a.dimensions(); i++) - rv.args.append(concatenate_if("strideA", i), a.strides()[i]); + if(!sizeMapping.preloadKernargs) + { + for(size_t i = startStrideAB; i < a.dimensions(); i++) + rv.args.append(concatenate_if("strideA", i), a.strides()[i]); - for(size_t i = startStrideAB; i < b.dimensions(); i++) - rv.args.append(concatenate_if("strideB", i), b.strides()[i]); + for(size_t i = startStrideAB; i < b.dimensions(); i++) + rv.args.append(concatenate_if("strideB", i), b.strides()[i]); + } { - int idx = 0; - for(auto size : problem.problemSizes()) + int maxIdx = problemSizes.size(); + if(sizeMapping.preloadKernargs) + maxIdx--; + for(int idx = 0; idx < maxIdx; idx++) { - rv.args.append(concatenate_if("size_", idx), size); - idx++; + rv.args.append(concatenate_if("size_", idx), problemSizes[idx]); } } @@ -576,7 +616,8 @@ namespace Tensile } } - rv.args.append("staggerUIter", staggerUIter(problem, inputs, hardware)); + if(sizeMapping.staggerU) + rv.args.append("staggerUIter", staggerUIter(problem, inputs, hardware)); rv.args.append("problemNumGroupTiles0", 
problemNumGroupTiles0); rv.args.append("problemNumGroupTiles1", problemNumGroupTiles1); diff --git a/Tensile/Source/lib/source/hip/HipSolutionAdapter.cpp b/Tensile/Source/lib/source/hip/HipSolutionAdapter.cpp index d3aa6d7ce..8c033aa2b 100644 --- a/Tensile/Source/lib/source/hip/HipSolutionAdapter.cpp +++ b/Tensile/Source/lib/source/hip/HipSolutionAdapter.cpp @@ -35,12 +35,6 @@ #include #include -//@TODO add alternative for windows -#ifndef _WIN32 -#include -#endif -#include - namespace Tensile { namespace hip diff --git a/Tensile/Tests/pre_checkin/preload_kernel_arguments_always_half.yaml b/Tensile/Tests/pre_checkin/preload_kernel_arguments_always_half.yaml new file mode 100644 index 000000000..7b916d944 --- /dev/null +++ b/Tensile/Tests/pre_checkin/preload_kernel_arguments_always_half.yaml @@ -0,0 +1,56 @@ +TestParameters: + marks: [skip-gfx900, skip-gfx906, skip-gfx908, + skip-gfx1010, skip-gfx1011, skip-gfx1012, + skip-gfx1030, skip-gfx1031, skip-gfx1032, + skip-gfx1034, skip-gfx1035, skip-gfx1100, + skip-gfx1101, skip-gfx1102] + +GlobalParameters: + MinimumRequiredVersion: 4.2.0 + NumElementsToValidate: -1 + BoundsCheck: False + KernelTime: True + HardwareMonitor: False + +BenchmarkProblems: + - # hgemm TT + - # ProblemType + OperationType: GEMM + DataType: h + DestDataType: h + ComputeDataType: s + HighPrecisionAccumulate: True + TransposeA: True + TransposeB: True + UseBeta: True + Batched: True + + - # BenchmarkProblemSizeGroup - Assembly + InitialSolutionParameters: + BenchmarkCommonParameters: + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - PreloadKernelArguments: [1] + - DelayRemainingArguments: [True] + + - PrefetchLocalRead: [False] + - PrefetchGlobalRead: [True] + + - EdgeType: ["Branch"] + - ThreadTile: + - [ 16, 8 ] + - WorkGroup: + - [ 16, 16, 1 ] + - DepthU: [32] + - VectorWidth: [-1] + - AssertSummationElementMultiple: [1] + - AssertFree0ElementMultiple: [1] + - StaggerU: [0] + - WorkGroupMapping: [ 1 ] + 
BenchmarkForkParameters: + JoinParameters: + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Range: [ [129,1,129], 0, [2], [62,1,62] ] diff --git a/Tensile/Tests/pre_checkin/preload_kernel_arguments_half_bfloat16_sgemm.yaml b/Tensile/Tests/pre_checkin/preload_kernel_arguments_half_bfloat16_sgemm.yaml new file mode 100644 index 000000000..70d0c8352 --- /dev/null +++ b/Tensile/Tests/pre_checkin/preload_kernel_arguments_half_bfloat16_sgemm.yaml @@ -0,0 +1,175 @@ +GlobalParameters: + MinimumRequiredVersion: 4.2.0 + NumElementsToValidate: -1 + BoundsCheck: False + KernelTime: True + HardwareMonitor: False + +BenchmarkProblems: + - # hgemm TT + - # ProblemType + OperationType: GEMM + DataType: h + DestDataType: h + ComputeDataType: s + HighPrecisionAccumulate: True + TransposeA: True + TransposeB: True + UseBeta: True + Batched: True + + - # BenchmarkProblemSizeGroup - Assembly + InitialSolutionParameters: + BenchmarkCommonParameters: + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - PreloadKernelArguments: [0, 1] + - DelayRemainingArguments: [False, True] + + - PrefetchLocalRead: [False] + - PrefetchGlobalRead: [False,True] + + - EdgeType: ["Branch", "ShiftPtr"] + - ThreadTile: + - [ 16, 8 ] + - WorkGroup: + - [ 16, 16, 1 ] + - DepthU: [32] + - VectorWidth: [-1] + - AssertSummationElementMultiple: [1] + - AssertFree0ElementMultiple: [1] + - StaggerU: [0, 2, 32] + - WorkGroupMapping: [ 1, 8 ] + BenchmarkForkParameters: + JoinParameters: + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Range: [ [129,1,129], 0, [2], [62,1,62] ] + + - # hgemm NT + - # ProblemType + OperationType: GEMM + DataType: h + DestDataType: h + ComputeDataType: s + HighPrecisionAccumulate: True + TransposeA: False + TransposeB: True + UseBeta: True + Batched: True + + - # BenchmarkProblemSizeGroup - Assembly + InitialSolutionParameters: + BenchmarkCommonParameters: + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + 
ForkParameters: + - PreloadKernelArguments: [-1] + - DelayRemainingArguments: [False, True] + + - PrefetchLocalRead: [False] + - PrefetchGlobalRead: [False,True] + + - EdgeType: ["Branch", "ShiftPtr"] + - ThreadTile: + - [ 16, 8 ] + - WorkGroup: + - [ 16, 16, 1 ] + - DepthU: [32] + - VectorWidth: [-1] + - AssertSummationElementMultiple: [1] + - AssertFree0ElementMultiple: [1] + - StaggerU: [0, 2, 32] + - WorkGroupMapping: [ 1, 8 ] + BenchmarkForkParameters: + JoinParameters: + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Range: [ [129,1,129], 0, [2], [62,1,62] ] + + - # BFloat16 gemm TT + - # ProblemType + OperationType: GEMM + DataType: B + DestDataType: B + ComputeDataType: s + HighPrecisionAccumulate: True + TransposeA: True + TransposeB: True + UseBeta: True + Batched: True + + - # BenchmarkProblemSizeGroup - Assembly + InitialSolutionParameters: + BenchmarkCommonParameters: + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - PreloadKernelArguments: [0, 1] + - DelayRemainingArguments: [False, True] + + - PrefetchLocalRead: [False] + - PrefetchGlobalRead: [False,True] + + - EdgeType: ["Branch", "ShiftPtr"] + - ThreadTile: + - [ 16, 8 ] + - WorkGroup: + - [ 16, 16, 1 ] + - DepthU: [32] + - VectorWidth: [-1] + - AssertSummationElementMultiple: [1] + - AssertFree0ElementMultiple: [1] + - StaggerU: [0, 2, 32] + - WorkGroupMapping: [ 1, 8 ] + BenchmarkForkParameters: + JoinParameters: + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Range: [ [129,1,129], 0, [2], [62,1,62] ] + + + - # sgemm TT + - # ProblemType + OperationType: GEMM + DataType: s + DestDataType: s + ComputeDataType: s + TransposeA: True + TransposeB: True + UseBeta: True + Batched: True + + - # BenchmarkProblemSizeGroup - Assembly + InitialSolutionParameters: + BenchmarkCommonParameters: + - LoopTail: [True] + - KernelLanguage: ["Assembly"] + ForkParameters: + - PreloadKernelArguments: [0, 1] + - DelayRemainingArguments: 
[False, True] + + - PrefetchLocalRead: [False] + - PrefetchGlobalRead: [False,True] + + - EdgeType: ["Branch", "ShiftPtr"] + - ThreadTile: + - [ 8, 8 ] + - WorkGroup: + - [ 16, 16, 1 ] + - DepthU: [32] + - VectorWidth: [-1] + - AssertSummationElementMultiple: [1] + - AssertFree0ElementMultiple: [1] + - StaggerU: [0, 2, 32] + - WorkGroupMapping: [ 1, 8 ] + BenchmarkForkParameters: + JoinParameters: + BenchmarkJoinParameters: + BenchmarkFinalParameters: + - ProblemSizes: + - Range: [ [129,1,129], 0, [2], [62,1,62] ] \ No newline at end of file From 1489d85d5542f7fcde7a82270ffafecd87d42d35 Mon Sep 17 00:00:00 2001 From: Koji Nakajima <75698246+nakajee@users.noreply.github.com> Date: Sat, 10 Feb 2024 01:58:33 +0900 Subject: [PATCH 51/51] fix memory allocation fail with FlushMemorySize + StridedBatched/Batched cases (#1881) - multiply batch count size when calculating array size --- Tensile/Source/client/main.cpp | 14 ++++++++------ 1 file changed, 8 insertions(+), 6 deletions(-) diff --git a/Tensile/Source/client/main.cpp b/Tensile/Source/client/main.cpp index 792db82b2..89393d9a5 100644 --- a/Tensile/Source/client/main.cpp +++ b/Tensile/Source/client/main.cpp @@ -2,7 +2,7 @@ * * MIT License * - * Copyright (C) 2019-2022 Advanced Micro Devices, Inc. All rights reserved. + * Copyright (C) 2019-2024 Advanced Micro Devices, Inc. All rights reserved. 
* * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to deal @@ -503,11 +503,13 @@ size_t calculate_flush_count(size_t arg_fl size_t cached_size = 0; for(auto const& problem : problemFactory.problems()) - cached_size = std::max( - cached_size, - problem.a().sizes()[0] * problem.a().sizes()[1] * problem.a().elementBytes() - + problem.b().sizes()[0] * problem.b().sizes()[1] * problem.b().elementBytes() - + problem.c().sizes()[0] * problem.c().sizes()[1] * problem.c().elementBytes()); + { + size_t aSize = problem.a().elementBytes() * problem.a().totalLogicalElements(); + size_t bSize = problem.b().elementBytes() * problem.b().totalLogicalElements(); + size_t cSize = problem.c().elementBytes() * problem.c().totalLogicalElements(); + + cached_size = std::max(cached_size, aSize + bSize + cSize); + } if(arg_flush_count != default_arg_flush_count && arg_flush_memory_size != default_arg_flush_memory_size)