Skip to content

Commit acc40ab

Browse files
committed
update cubin export
Signed-off-by: Anthony Chang <[email protected]>
1 parent 35d9db3 commit acc40ab

File tree

1,418 files changed

+21029
-9378
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

1,418 files changed

+21029
-9378
lines changed
Lines changed: 78 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,78 @@
1+
---
2+
AccessModifierOffset: -4
3+
AlignAfterOpenBracket: DontAlign
4+
AlignConsecutiveAssignments: None
5+
AlignConsecutiveDeclarations: None
6+
AlignOperands: false
7+
AlignTrailingComments: true
8+
AllowAllParametersOfDeclarationOnNextLine: true
9+
AllowShortBlocksOnASingleLine: Empty
10+
AllowShortCaseLabelsOnASingleLine: true
11+
AllowShortFunctionsOnASingleLine: Empty
12+
AllowShortIfStatementsOnASingleLine: false
13+
AllowShortLoopsOnASingleLine: false
14+
AlwaysBreakAfterDefinitionReturnType: None
15+
AlwaysBreakAfterReturnType: None
16+
AlwaysBreakBeforeMultilineStrings: true
17+
AlwaysBreakTemplateDeclarations: Yes
18+
BasedOnStyle: None
19+
BinPackArguments: true
20+
BinPackParameters: true
21+
BreakBeforeBinaryOperators: All
22+
BreakBeforeBraces: Allman
23+
BreakBeforeTernaryOperators: true
24+
BreakConstructorInitializersBeforeComma: true
25+
ColumnLimit: 120
26+
CommentPragmas: '^ IWYU pragma:'
27+
ConstructorInitializerAllOnOneLineOrOnePerLine: false
28+
ConstructorInitializerIndentWidth: 4
29+
ContinuationIndentWidth: 4
30+
Cpp11BracedListStyle: true
31+
DerivePointerAlignment: false
32+
DisableFormat: false
33+
ExperimentalAutoDetectBinPacking: false
34+
ForEachMacros: [ foreach, Q_FOREACH, BOOST_FOREACH ]
35+
IncludeBlocks: Preserve
36+
IncludeCategories:
37+
- Regex: '^"(llvm|llvm-c|clang|clang-c)/'
38+
Priority: 2
39+
- Regex: '^(<|"(gtest|isl|json)/)'
40+
Priority: 3
41+
- Regex: '.*'
42+
Priority: 1
43+
IndentCaseLabels: false
44+
IndentWidth: 4
45+
IndentWrappedFunctionNames: false
46+
KeepEmptyLinesAtTheStartOfBlocks: true
47+
Language: Cpp
48+
MacroBlockBegin: ''
49+
MacroBlockEnd: ''
50+
MaxEmptyLinesToKeep: 1
51+
NamespaceIndentation: None
52+
ObjCBlockIndentWidth: 4
53+
ObjCSpaceAfterProperty: true
54+
ObjCSpaceBeforeProtocolList: true
55+
PenaltyBreakBeforeFirstCallParameter: 19
56+
PenaltyBreakComment: 300
57+
PenaltyBreakFirstLessLess: 120
58+
PenaltyBreakString: 1000
59+
PenaltyExcessCharacter: 1000000
60+
PenaltyReturnTypeOnItsOwnLine: 60
61+
PointerAlignment: Left
62+
QualifierAlignment: Right
63+
ReflowComments: true
64+
SeparateDefinitionBlocks: Always
65+
SortIncludes: false
66+
SpaceAfterCStyleCast: true
67+
SpaceBeforeAssignmentOperators: true
68+
SpaceBeforeParens: ControlStatements
69+
SpaceInEmptyParentheses: false
70+
SpacesBeforeTrailingComments: 1
71+
SpacesInAngles: false
72+
SpacesInCStyleCastParentheses: false
73+
SpacesInContainerLiterals: true
74+
SpacesInParentheses: false
75+
SpacesInSquareBrackets: false
76+
Standard: c++14
77+
TabWidth: 4
78+
UseTab: Never

cpp/tensorrt_llm/kernels/trtllmGenKernels/batchedGemm/trtllmGen_bmm_export/BatchedGemmEnums.h

Lines changed: 11 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -16,8 +16,8 @@
1616
*/
1717
#pragma once
1818

19-
#include <cassert>
2019
#include <string>
20+
#include <cassert>
2121

2222
namespace batchedGemm
2323
{
@@ -34,7 +34,9 @@ enum class RouteImpl
3434
// Use LDGSTS to do the routing
3535
Ldgsts = 1,
3636
// Use UTMALDG.GATHER4 to do the routing
37-
Tma = 2
37+
Tma = 2,
38+
// Use LDG+STS to do the routing
39+
LdgPlusSts = 3
3840
};
3941

4042
////////////////////////////////////////////////////////////////////////////////////////////////////
@@ -60,6 +62,13 @@ inline bool doesRouteImplUseTma(RouteImpl mode)
6062

6163
////////////////////////////////////////////////////////////////////////////////////////////////////
6264

65+
// Returns true when `mode` equals RouteImpl::LdgPlusSts (the LDG+STS routing implementation), false otherwise.
inline bool doesRouteImplUseLdgPlusSts(RouteImpl mode)
66+
{
67+
return (mode == RouteImpl::LdgPlusSts);
68+
}
69+
70+
////////////////////////////////////////////////////////////////////////////////////////////////////
71+
6372
} // namespace batchedGemm
6473

6574
////////////////////////////////////////////////////////////////////////////////////////////////////

0 commit comments

Comments
 (0)