// composable_kernel/example/ck_tile/49_sageattention/quant.hpp

// Copyright (c) Advanced Micro Devices, Inc., or its affiliates.
// SPDX-License-Identifier: MIT

#pragma once

#include <ostream>
#include <stdexcept>
#include <string>
#include "ck_tile/core.hpp"
#include "ck_tile/ops/sageattention/block/block_sageattention_quant_scale_enum.hpp"

// Selector for the quantization-scale mode chosen for a run.
//
// Keep the enumerators and their numeric values in sync with
// BlockSageAttentionQuantScaleEnum (presumably declared in the
// block_sageattention_quant_scale_enum.hpp header included above -- confirm
// there when adding or renumbering an entry).
//
// Each enumerator also has a text token and a decimal index accepted by
// quant_scale_info::decode(); the trailing comments list them.
enum class quant_scale_enum
{
    no_scale   = 0, // token "n"   / "0"
    pertensor  = 1, // token "pt"  / "1"
    blockscale = 2, // token "bs"  / "2"
    perwarp    = 3, // token "pw"  / "3"
    perthread  = 4, // token "pth" / "4"
};

struct quant_scale_info
{
    quant_scale_enum type;

    void serialize(std::ostream& os) const
    {
        if(type == quant_scale_enum::no_scale)
            os << "n";
        else if(type == quant_scale_enum::pertensor)
            os << "pt";
        else if(type == quant_scale_enum::blockscale)
            os << "bs";
        else if(type == quant_scale_enum::perwarp)
            os << "pw";
        else if(type == quant_scale_enum::perthread)
            os << "pth";
    }

    static quant_scale_info decode(std::string str)
    {
        quant_scale_info info{quant_scale_enum::no_scale};
        if(str == "n" || str == "0")
        {
            info.type = quant_scale_enum::no_scale;
        }
        else if(str == "pt" || str == "1")
        {
            info.type = quant_scale_enum::pertensor;
        }
        else if(str == "bs" || str == "2")
        {
            info.type = quant_scale_enum::blockscale;
        }
        else if(str == "pw" || str == "3")
        {
            info.type = quant_scale_enum::perwarp;
        }
        else if(str == "pth" || str == "4")
        {
            info.type = quant_scale_enum::perthread;
        }
        else
        {
            throw std::invalid_argument("invalid quant scale value: " + str);
        }
        return info;
    }

    friend std::ostream& operator<<(std::ostream& os, const quant_scale_info& qsi)
    {
        qsi.serialize(os);
        return os;
    }
};