Skip to content

Commit

Permalink
Merge pull request #79 from guacamoleo/develop
Browse files Browse the repository at this point in the history
fixed global increments and updating configs
  • Loading branch information
guacamoleo authored Apr 6, 2017
2 parents 35756bd + 4aaf327 commit 43a6c36
Show file tree
Hide file tree
Showing 23 changed files with 949 additions and 130 deletions.
10 changes: 8 additions & 2 deletions Jenkinsfile
Original file line number Diff line number Diff line change
Expand Up @@ -65,8 +65,14 @@ parallel rocm_fiji: {
// run jenkins tests
dir("${build_dir_release}") {
stage("unit tests") {
- sh "tensile ../../Tensile/Configs/jenkins_sgemm_defaults.yaml sgemm_defaults"
- sh "tensile ../../Tensile/Configs/jenkins_dgemm_defaults.yaml dgemm_defaults"
+ sh "tensile ../../Tensile/Configs/test_sgemm_defaults.yaml sgemm_defaults"
+ sh "tensile ../../Tensile/Configs/test_sgemm_scalar_load_patterns.yaml sgemm_scalar_load_patterns"
+ sh "tensile ../../Tensile/Configs/test_sgemm_scalar_tile_sizes.yaml sgemm_scalar_tile_sizes"
+ sh "tensile ../../Tensile/Configs/test_sgemm_scalar_branches.yaml sgemm_scalar_branches"
+ //sh "tensile ../../Tensile/Configs/test_sgemm_vector_load_patterns.yaml sgemm_vector_load_patterns"
+ //sh "tensile ../../Tensile/Configs/test_sgemm_vector_tile_sizes.yaml sgemm_vector_tile_sizes"
+ //sh "tensile ../../Tensile/Configs/test_sgemm_vector_branches.yaml sgemm_vector_branches"
+ sh "tensile ../../Tensile/Configs/test_dgemm_defaults.yaml dgemm_defaults"
}
}
}
Expand Down
13 changes: 10 additions & 3 deletions Tensile/ClientWriter.py
Original file line number Diff line number Diff line change
Expand Up @@ -117,20 +117,27 @@ def writeRunScript(path, libraryLogicPath, forBenchmark):
# runtime and kernel language
runScriptFile.write(" -DTensile_RUNTIME_LANGUAGE=%s" \
% globalParameters["RuntimeLanguage"])
- #runScriptFile.write(" -DTensile_KERNEL_LANGUAGE=%s" \
- # % globalParameters["KernelLanguage"])
if forBenchmark:
# for benchmark client
runScriptFile.write(" -DTensile_CLIENT_BENCHMARK=ON")
else:
# for library client
- runScriptFile.write(" -DTensile_ROOT=%s" % os.path.join(globalParameters["ScriptPath"], "..") )
+ runScriptFile.write(" -DTensile_ROOT=%s" \
+ % os.path.join(globalParameters["ScriptPath"], "..") )
+ runScriptFile.write(" -DTensile_KERNEL_LANGUAGE=%s" \
+ % globalParameters["KernelLanguage"])
runScriptFile.write(" -DTensile_CLIENT_BENCHMARK=OFF")
runScriptFile.write(" -DTensile_LOGIC_PATH=%s" % libraryLogicPath)
runScriptFile.write(" -DTensile_LIBRARY_PRINT_DEBUG=%s" \
% ("ON" if globalParameters["LibraryPrintDebug"] else "OFF"))
runScriptFile.write(" -DTensile_SHORT_FILE_NAMES=%s" \
% ("ON" if globalParameters["ShortNames"] else "OFF"))
+ if globalParameters["CMakeCXXFlags"]:
+ runScriptFile.write(" -DCMAKE_CXX_FLAGS=%s" \
+ % globalParameters["CMakeCXXFlags"] )
+ if globalParameters["CMakeCFlags"]:
+ runScriptFile.write(" -DCMAKE_C_FLAGS=%s" \
+ % globalParameters["CMakeCFlags"] )
# for both
if os.name == "nt":
runScriptFile.write(" -DCMAKE_GENERATOR_PLATFORM=x64")
Expand Down
6 changes: 4 additions & 2 deletions Tensile/Common.py
Original file line number Diff line number Diff line change
Expand Up @@ -37,6 +37,8 @@
globalParameters["Device"] = 0
# benchmark behavior
globalParameters["CMakeBuildType"] = "Release" # Debug
+ globalParameters["CMakeCXXFlags"] = ""
+ globalParameters["CMakeCFlags"] = ""
globalParameters["ForceRedoBenchmarkProblems"] = True
globalParameters["ForceRedoLibraryLogic"] = True
globalParameters["ForceRedoLibraryClient"] = True
Expand All @@ -47,8 +49,8 @@
globalParameters["ShortNames"] = False
globalParameters["MergeFiles"] = True
# validation
- globalParameters["NumElementsToValidate"] = 16
- globalParameters["ValidationMaxToPrint"] = 16
+ globalParameters["NumElementsToValidate"] = 128
+ globalParameters["ValidationMaxToPrint"] = 4
globalParameters["ValidationPrintValids"] = False
globalParameters["DataInitType"] = 0 # 0=rand, 1=1, 2=serial
# protect against invalid kernel
Expand Down
10 changes: 5 additions & 5 deletions Tensile/Configs/rocblas_cgemm.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ GlobalParameters:
SyncsPerBenchmark: 8
LibraryPrintDebug: False
NumElementsToValidate: 128
- ValidationMaxToPrint: 16
+ ValidationMaxToPrint: 4
ValidationPrintValids: False
ShortNames: False
MergeFiles: True
Expand All @@ -30,7 +30,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand Down Expand Up @@ -62,7 +62,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand Down Expand Up @@ -94,7 +94,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand Down Expand Up @@ -126,7 +126,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ -1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand Down
10 changes: 5 additions & 5 deletions Tensile/Configs/rocblas_dgemm.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ GlobalParameters:
SyncsPerBenchmark: 8
LibraryPrintDebug: False
NumElementsToValidate: 128
- ValidationMaxToPrint: 16
+ ValidationMaxToPrint: 4
ValidationPrintValids: False
ShortNames: False
MergeFiles: True
Expand All @@ -30,7 +30,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand Down Expand Up @@ -62,7 +62,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand Down Expand Up @@ -94,7 +94,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand Down Expand Up @@ -126,7 +126,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ -1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand Down
14 changes: 9 additions & 5 deletions Tensile/Configs/rocblas_sgemm.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ GlobalParameters:
SyncsPerBenchmark: 8
LibraryPrintDebug: False
NumElementsToValidate: 128
- ValidationMaxToPrint: 16
+ ValidationMaxToPrint: 4
ValidationPrintValids: False
ShortNames: False
MergeFiles: True
Expand All @@ -30,14 +30,15 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [1], [2880] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
- GroupShape: [ 0 ]
- ThreadTileShape: [ 0 ]
- NumLoadsCoalescedA: [-1]
- NumLoadsCoalescedB: [1]
+ - VectorWidth: [2]
ForkParameters:
- NumThreads: [64, 128, 256]
- ThreadTileNumElements: [4, 16, 36, 64]
Expand All @@ -62,14 +63,15 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [1], [2880] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
- GroupShape: [ 0 ]
- ThreadTileShape: [ 0 ]
- NumLoadsCoalescedA: [-1]
- NumLoadsCoalescedB: [-1]
+ - VectorWidth: [2]
ForkParameters:
- NumThreads: [64, 128, 256]
- ThreadTileNumElements: [4, 16, 36, 64]
Expand All @@ -94,12 +96,13 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [2880] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
- NumLoadsCoalescedA: [1]
- NumLoadsCoalescedB: [1]
+ - VectorWidth: [2]
ForkParameters:
- GroupShape: [ 0, 2 ]
- ThreadTileShape: [ 0, 2 ]
Expand All @@ -126,14 +129,15 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [2880] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ -1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
- ThreadTileShape: [ 0 ]
- NumLoadsCoalescedA: [1]
- NumLoadsCoalescedB: [-1]
- GroupShape: [ 0 ]
+ - VectorWidth: [2]
ForkParameters:
- NumThreads: [64, 128, 256]
- ThreadTileNumElements: [4, 16, 36, 64]
Expand Down
18 changes: 9 additions & 9 deletions Tensile/Configs/rocblas_zgemm.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@ GlobalParameters:
SyncsPerBenchmark: 8
LibraryPrintDebug: False
NumElementsToValidate: 128
- ValidationMaxToPrint: 16
+ ValidationMaxToPrint: 4
ValidationPrintValids: False
ShortNames: False
MergeFiles: True
Expand All @@ -21,7 +21,7 @@ BenchmarkProblems:
# zgemm NN
- ProblemType:
OperationType: GEMM
- DataType: s
+ DataType: z
TransposeA: False
TransposeB: False
UseBeta: True
Expand All @@ -30,7 +30,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand All @@ -53,7 +53,7 @@ BenchmarkProblems:
# zgemm NT
- ProblemType:
OperationType: GEMM
- DataType: s
+ DataType: z
TransposeA: False
TransposeB: True
UseBeta: True
Expand All @@ -62,7 +62,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand All @@ -85,7 +85,7 @@ BenchmarkProblems:
# zgemm TN
- ProblemType:
OperationType: GEMM
- DataType: s
+ DataType: z
TransposeA: True
TransposeB: False
UseBeta: True
Expand All @@ -94,7 +94,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ 1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand All @@ -117,7 +117,7 @@ BenchmarkProblems:
# zgemm TT
- ProblemType:
OperationType: GEMM
- DataType: s
+ DataType: z
TransposeA: True
TransposeB: True
UseBeta: True
Expand All @@ -126,7 +126,7 @@ BenchmarkProblems:
# keep benchmark as single list to make easier to modify in future
BenchmarkCommonParameters:
- ProblemSizes: [ [2880], [2880], [2], [1536] ]
- - EdgeType: ["Branch"]
+ - EdgeType: ["Shift"]
- WorkGroupMapping: [ -1 ]
- LoopDoWhile: [False]
- LoopTail: [True]
Expand Down
2 changes: 1 addition & 1 deletion Tensile/Configs/sgemm.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@ GlobalParameters:
SyncsPerBenchmark: 1
LibraryPrintDebug: False
NumElementsToValidate: 128
- ValidationMaxToPrint: 16
+ ValidationMaxToPrint: 4
ValidationPrintValids: False
ShortNames: False
MergeFiles: True
Expand Down
Loading

0 comments on commit 43a6c36

Please sign in to comment.