mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-14 18:17:44 +00:00
* Adding RapidJson Library
* Adding Json Dumps in all CK_Tile Examples
Not verified yet
* Adding json to cktile Batched Transpose
* adding json dumps to layernorm2d_fwd
* Adding json dump to flatmm_basic
* Adding RapidJson Library
* Adding Json Dumps in all CK_Tile Examples
Not verified yet
* Adding json to cktile Batched Transpose
* adding json dumps to layernorm2d_fwd
* Adding json dump to flatmm_basic
* Adding json in 03_gemm
* Add json dump to 16_batched_gemm
* Add json dump to gemm_multi_d_fp16
* Add json dump to grouped_gemm
* fix fmha_bwd/fwd
* Fix clang-format errors
exclude include/rapidjson in Jenkins as it's a third-party library
* Separating function and definition.
* Update Documentation of 03_gemm
* Refactoring as per code review
* Disable fp8 instances on unsupported targets (#2592)
* Restrict building of gemm_universal_preshuffle_f8 instances to specific targets in CMakeLists.txt
* Add condition to skip gemm_xdl_universal_preshuffle_f8 instances for unsupported targets in CMakeLists.txt
* Add conditions to skip unsupported targets for gemm_universal_preshuffle_f8 and gemm_xdl_universal_preshuffle_f8 instances in CMakeLists.txt
* Refine conditions to exclude gemm_universal_preshuffle_f8 instances for unsupported targets in CMakeLists.txt
---------
Co-authored-by: AviralGoelAMD <aviralgoel@amd.com>
* fix clang format
* remove duplicate lines of code from library/src/tensor_operation_instance/gpu/CMakeLists.txt
* Fixing Readme and unifying jsondumps
* adding moe_smoothquant
* adding fused_moe
* Fixing Readme for batched_gemm
* Fixing Readme for grouped_gemm
* adding flatmm
* adding gemm_multi_d_fp16
* adding elementwise
* adding File name when json is dumped
* Fixing Reduce after merge
* adding batched_transpose
* Adding Warptile in Gemm
* Fixing Clang Format
---------
Co-authored-by: Aviral Goel <aviral.goel@amd.com>
Co-authored-by: AviralGoelAMD <aviralgoel@amd.com>
Co-authored-by: illsilin_amdeng <Illia.Silin@amd.com>
[ROCm/composable_kernel commit: 4d041837ad]
84 lines
2.7 KiB
C++
84 lines
2.7 KiB
C++
// Tencent is pleased to support the open source community by making RapidJSON available.
|
|
//
|
|
// Copyright (C) 2015 THL A29 Limited, a Tencent company, and Milo Yip.
|
|
//
|
|
// Licensed under the MIT License (the "License"); you may not use this file except
|
|
// in compliance with the License. You may obtain a copy of the License at
|
|
//
|
|
// http://opensource.org/licenses/MIT
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software distributed
|
|
// under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
|
|
// CONDITIONS OF ANY KIND, either express or implied. See the License for the
|
|
// specific language governing permissions and limitations under the License.
|
|
|
|
#ifndef RAPIDJSON_INTERNAL_STRFUNC_H_
|
|
#define RAPIDJSON_INTERNAL_STRFUNC_H_
|
|
|
|
#include "../stream.h"
|
|
#include <cwchar>
|
|
|
|
RAPIDJSON_NAMESPACE_BEGIN
|
|
namespace internal {
|
|
|
|
//! Custom strlen() which works on different character types.
|
|
/*! \tparam Ch Character type (e.g. char, wchar_t, short)
|
|
\param s Null-terminated input string.
|
|
\return Number of characters in the string.
|
|
\note This has the same semantics as strlen(), the return value is not number of Unicode codepoints.
|
|
*/
|
|
template <typename Ch>
|
|
inline SizeType StrLen(const Ch* s) {
|
|
RAPIDJSON_ASSERT(s != 0);
|
|
const Ch* p = s;
|
|
while (*p) ++p;
|
|
return SizeType(p - s);
|
|
}
|
|
|
|
template <>
|
|
inline SizeType StrLen(const char* s) {
|
|
return SizeType(std::strlen(s));
|
|
}
|
|
|
|
template <>
|
|
inline SizeType StrLen(const wchar_t* s) {
|
|
return SizeType(std::wcslen(s));
|
|
}
|
|
|
|
//! Custom strcmp() which works on different character types.
/*! \tparam Ch Character type (e.g. char, wchar_t, short)
    \param s1 Null-terminated input string; must not be null.
    \param s2 Null-terminated input string; must not be null.
    \return 0 if the strings are equal, -1 if the first differing element of
            \c s1 is smaller than that of \c s2, 1 if it is larger.
    \note The differing elements are compared after conversion to \c unsigned.
*/
template<typename Ch>
inline int StrCmp(const Ch* s1, const Ch* s2) {
    RAPIDJSON_ASSERT(s1 != 0);
    RAPIDJSON_ASSERT(s2 != 0);

    // Skip the common prefix; stop at the end of s1 or at the first mismatch.
    for (; *s1 && (*s1 == *s2); ++s1, ++s2) {
    }

    const unsigned lhs = static_cast<unsigned>(*s1);
    const unsigned rhs = static_cast<unsigned>(*s2);
    if (lhs < rhs)
        return -1;
    return lhs > rhs ? 1 : 0;
}
|
|
|
|
//! Returns number of code points in a encoded string.
|
|
template<typename Encoding>
|
|
bool CountStringCodePoint(const typename Encoding::Ch* s, SizeType length, SizeType* outCount) {
|
|
RAPIDJSON_ASSERT(s != 0);
|
|
RAPIDJSON_ASSERT(outCount != 0);
|
|
GenericStringStream<Encoding> is(s);
|
|
const typename Encoding::Ch* end = s + length;
|
|
SizeType count = 0;
|
|
while (is.src_ < end) {
|
|
unsigned codepoint;
|
|
if (!Encoding::Decode(is, &codepoint))
|
|
return false;
|
|
count++;
|
|
}
|
|
*outCount = count;
|
|
return true;
|
|
}
|
|
|
|
} // namespace internal
|
|
RAPIDJSON_NAMESPACE_END
|
|
|
|
#endif // RAPIDJSON_INTERNAL_STRFUNC_H_
|