-
Notifications
You must be signed in to change notification settings - Fork 545
/
weightUtils.hpp
66 lines (54 loc) · 2.7 KB
/
weightUtils.hpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
/*
* SPDX-License-Identifier: Apache-2.0
*/
#pragma once
#include "ShapedWeights.hpp"
#include "bfloat16.hpp"
#include "half.h"
#include <NvInfer.h>
#include <typeindex>
#include <unordered_map>
// Subset of helper functions that deal exclusively with weights, so that they can be shared across the IParser and IParserRefitter classes.
// Define weightLog macros here to ensure that an ImporterCtx class is not needed to log.
namespace onnx2trt
{
// Return the name of an ONNX data enum.
//   onnxDtype: the ONNX data type enum value, passed as a plain int32_t.
//   Returns a C string naming that data type.
// NOTE(review): the lifetime of the returned pointer and the result for unrecognized enum values are
// determined by the implementation, which is not visible in this header - confirm before relying on them.
char const* getDtypeName(int32_t onnxDtype);
// Return the size in bits of an ONNX data type.
//   onnxDtype: the ONNX data type enum value, passed as a plain int32_t.
//   Returns the width of one element of that type, measured in bits (not bytes).
// NOTE(review): the value returned for unsupported data types is not visible from this header - confirm
// against the implementation.
int32_t getDtypeSizeBits(int32_t onnxDtype);
// Return the size in bytes of a tensor/weights object, handling padding for sub-byte data types.
//   count:     number of elements in the tensor/weights object.
//   onnxDtype: the ONNX data type enum value of the elements, passed as a plain int32_t.
//   Returns the total storage size in bytes.
// NOTE(review): presumably the bit count is rounded up to whole bytes for sub-byte types - confirm
// against the implementation.
size_t getTensorOrWeightsSizeBytes(int64_t count, int32_t onnxDtype);
// Find the corresponding ONNX data type of a built-in data type.
//   T: the C++ element type to translate (selected by explicit template argument; there are no
//      function parameters).
//   Returns the ONNX TensorProto data type registered for T in the table below, or
//   TensorProto::UNDEFINED when T is not one of the listed types.
template <typename T>
ShapedWeights::DataType getShapedWeightsDataType()
{
    // Lookup table keyed by the run-time type identity of each supported element type.
    // Being a function-local static inside a template, every instantiation owns its own copy,
    // which is built once on the first call for that T.
    static std::unordered_map<std::type_index, ::ONNX_NAMESPACE::TensorProto::DataType> const tMap({
        {std::type_index(typeid(bool)), ::ONNX_NAMESPACE::TensorProto::BOOL},
        {std::type_index(typeid(int8_t)), ::ONNX_NAMESPACE::TensorProto::INT8},
        {std::type_index(typeid(uint8_t)), ::ONNX_NAMESPACE::TensorProto::UINT8},
        {std::type_index(typeid(int16_t)), ::ONNX_NAMESPACE::TensorProto::INT16},
        {std::type_index(typeid(uint16_t)), ::ONNX_NAMESPACE::TensorProto::UINT16},
        {std::type_index(typeid(int32_t)), ::ONNX_NAMESPACE::TensorProto::INT32},
        {std::type_index(typeid(uint32_t)), ::ONNX_NAMESPACE::TensorProto::UINT32},
        {std::type_index(typeid(int64_t)), ::ONNX_NAMESPACE::TensorProto::INT64},
        {std::type_index(typeid(uint64_t)), ::ONNX_NAMESPACE::TensorProto::UINT64},
        {std::type_index(typeid(float)), ::ONNX_NAMESPACE::TensorProto::FLOAT},
        {std::type_index(typeid(double)), ::ONNX_NAMESPACE::TensorProto::DOUBLE},
        {std::type_index(typeid(half_float::half)), ::ONNX_NAMESPACE::TensorProto::FLOAT16},
        {std::type_index(typeid(BFloat16)), ::ONNX_NAMESPACE::TensorProto::BFLOAT16},
        // TRT-22989: Add fp8 and int4 support
    });

    // Search once and reuse the iterator, instead of a find() followed by a second lookup via at().
    auto const match = tMap.find(std::type_index(typeid(T)));
    if (match != tMap.end())
    {
        return match->second;
    }

    // T is not a supported element type.
    return ::ONNX_NAMESPACE::TensorProto::UNDEFINED;
}
// Return the volume of a Dims object
//   dims: the TensorRT dimensions object to measure (read-only).
//   Returns the volume as a 64-bit signed integer.
// NOTE(review): presumably the volume is the product of all dimension extents; how empty or
// dynamic (-1) dimensions are treated is not visible from this header - confirm against the implementation.
int64_t volume(nvinfer1::Dims const& dims);
// Normalize the slashes in a string representing a filepath.
//   path: the filepath string to normalize (read-only; the input is not modified).
//   Returns the normalized path as a new string.
// NOTE(review): which slash style is treated as canonical is not visible from this header - confirm
// against the implementation.
std::string normalizePath(std::string const& path);
// Generate a unique name for a given weight or tensor name (passed as the |basename|)
//   namesSet:      set of names; taken by non-const reference, so the call may modify it.
//   suffixCounter: counter taken by non-const reference, so the call may modify it.
//   basename:      the weight or tensor name that the unique name is generated for.
//   Returns a reference to the generated name rather than a copy.
// NOTE(review): presumably the returned reference points at an element stored in |namesSet| and
// stays valid only while that element exists - confirm against the implementation.
std::string const& generateUniqueName(
std::set<std::string>& namesSet, int64_t& suffixCounter, std::string const& basename);
} // namespace onnx2trt