mlc-ai
diff --git a/‎.github/workflows/ci.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/ci.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.pre-commit-config.yaml‎
Lines changed: 4 additions & 4 deletions b/‎.pre-commit-config.yaml‎
Lines changed: 4 additions & 4 deletions
diff --git a/‎cpp/c_api.cc‎
Lines changed: 0 additions & 1 deletion b/‎cpp/c_api.cc‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎cpp/registry.h‎
Lines changed: 277 additions & 52 deletions b/‎cpp/registry.h‎
Lines changed: 277 additions & 52 deletions
diff --git a/‎include/mlc/base/lib.h‎
Lines changed: 6 additions & 0 deletions b/‎include/mlc/base/lib.h‎
Lines changed: 6 additions & 0 deletions
diff --git a/‎include/mlc/base/traits_device.h‎
Lines changed: 15 additions & 74 deletions b/‎include/mlc/base/traits_device.h‎
Lines changed: 15 additions & 74 deletions
diff --git a/‎include/mlc/base/traits_dtype.h‎
Lines changed: 10 additions & 98 deletions b/‎include/mlc/base/traits_dtype.h‎
Lines changed: 10 additions & 98 deletions
diff --git a/‎include/mlc/c_api.h‎
Lines changed: 24 additions & 5 deletions b/‎include/mlc/c_api.h‎
Lines changed: 24 additions & 5 deletions
@@ -3,7 +3,7 @@ name: CI
 on: [push, pull_request]
 env:
   CIBW_BUILD_VERBOSITY: 3
-  CIBW_TEST_REQUIRES: "pytest"
+  CIBW_TEST_REQUIRES: "pytest torch"
   CIBW_TEST_COMMAND: "pytest -svv --durations=20 {project}/tests/python/"
   MLC_CIBW_VERSION: "2.22.0"
   MLC_PYTHON_VERSION: "3.9"
 
@@ -14,21 +14,21 @@ repos:
       - id: check-toml
       - id: check-added-large-files
   - repo: https://github.com/astral-sh/ruff-pre-commit
-    rev: v0.8.4
+    rev: v0.9.0
     hooks:
       - id: ruff
         types_or: [python, pyi, jupyter]
         args: [--fix]
       - id: ruff-format
         types_or: [python, pyi, jupyter]
   - repo: https://github.com/pre-commit/mirrors-mypy
-    rev: "v1.14.0"
+    rev: "v1.14.1"
     hooks:
       - id: mypy
-        additional_dependencies: ['numpy >= 1.22', "ml-dtypes >= 0.1", "pytest"]
+        additional_dependencies: ['numpy >= 1.22', "ml-dtypes >= 0.1", "pytest", "torch"]
         args: [--show-error-codes]
   - repo: https://github.com/pre-commit/mirrors-clang-format
-    rev: "v19.1.5"
+    rev: "v19.1.6"
     hooks:
       - id: clang-format
   - repo: https://github.com/MarcoGorelli/cython-lint
 
@@ -19,7 +19,6 @@ using ::mlc::registry::TypeTable;
 
 namespace {
 thread_local Any last_error;
-MLC_REGISTER_FUNC("mlc.ffi.LoadDSO").set_body([](std::string name) { TypeTable::Get(nullptr)->LoadDSO(name); });
 } // namespace
 
 MLC_API MLCAny MLCGetLastError() {
 
@@ -11,6 +11,12 @@ struct Lib {
   static ::mlc::Str CxxStr(AnyView obj);
   static ::mlc::Str Str(AnyView obj);
   static Any IRPrint(AnyView obj, AnyView printer, AnyView path);
+  static const char *DeviceTypeToStr(int32_t device_type); // wrapped by base::DeviceType2Str (traits_device.h)
+  static int32_t DeviceTypeFromStr(const char *source); // base::DeviceFromStr rejects a negative result
+  static void DeviceTypeRegister(const char *name); // presumably adds a device type name; TODO confirm
+  static const char *DataTypeCodeToStr(int32_t dtype_code); // wrapped by base::DataTypeCode2Str (traits_dtype.h)
+  static DLDataType DataTypeFromStr(const char *source); // wrapped by base::DataTypeFromStr (traits_dtype.h)
+  static void DataTypeRegister(const char *name, int32_t dtype_bits); // presumably adds a dtype name; TODO confirm
 
   static FuncObj *_init(int32_t type_index) { return VTableGetFunc(init, type_index, "__init__"); }
   MLC_INLINE static MLCTypeInfo *GetTypeInfo(int32_t type_index) {
 
@@ -1,15 +1,16 @@
 #ifndef MLC_BASE_TRAITS_DEVICE_H_
 #define MLC_BASE_TRAITS_DEVICE_H_
 
+#include "./lib.h"
 #include "./utils.h"
-#include <unordered_map>
 
 namespace mlc {
 namespace base {
 
-const char *DLDeviceType2Str(DLDeviceType type);
-DLDevice String2DLDevice(const std::string &source);
+inline DLDevice DeviceFromStr(const std::string &source); // forward declaration; inline definition is below
+
 inline bool DeviceEqual(DLDevice a, DLDevice b) { return a.device_type == b.device_type && a.device_id == b.device_id; }
+inline const char *DeviceType2Str(int32_t device_type) { return ::mlc::Lib::DeviceTypeToStr(device_type); } // forwards to Lib
 
 template <> struct TypeTraits<DLDevice> {
   static constexpr int32_t type_index = static_cast<int32_t>(MLCTypeIndex::kMLCDevice);
@@ -26,10 +27,10 @@ template <> struct TypeTraits<DLDevice> {
       return v->v.v_device;
     }
     if (ty == MLCTypeIndex::kMLCRawStr) {
-      return String2DLDevice(v->v.v_str);
+      return DeviceFromStr(v->v.v_str);
     }
     if (ty == MLCTypeIndex::kMLCStr) {
-      return String2DLDevice(reinterpret_cast<const MLCStr *>(v->v.v_obj)->data);
+      return DeviceFromStr(reinterpret_cast<const MLCStr *>(v->v.v_obj)->data);
     }
     throw TemporaryTypeError();
   }
@@ -38,87 +39,27 @@ template <> struct TypeTraits<DLDevice> {
 
   MLC_INLINE static std::string __str__(DLDevice device) {
     std::ostringstream os;
-    os << DLDeviceType2Str(static_cast<DLDeviceType>(device.device_type)) << ":" << device.device_id;
+    os << DeviceType2Str(static_cast<int32_t>(device.device_type)) << ":" << device.device_id; // callee takes int32_t
     return os.str();
   }
-
-  static inline MLC_SYMBOL_HIDE std::unordered_map<std::string, DLDeviceType> str2device_type = {
-      {"cpu", kDLCPU},
-      {"cuda", kDLCUDA},
-      {"cuda_host", kDLCUDAHost},
-      {"opencl", kDLOpenCL},
-      {"vulkan", kDLVulkan},
-      {"mps", kDLMetal},
-      {"vpi", kDLVPI},
-      {"rocm", kDLROCM},
-      {"rocm_host", kDLROCMHost},
-      {"ext_dev", kDLExtDev},
-      {"cuda_managed", kDLCUDAManaged},
-      {"oneapi", kDLOneAPI},
-      {"webgpu", kDLWebGPU},
-      {"hexagon", kDLHexagon},
-      {"maia", kDLMAIA},
-      // aliases
-      {"llvm", kDLCPU},
-      {"nvptx", kDLCUDA},
-      {"cl", kDLOpenCL},
-      {"sdaccel", kDLOpenCL},
-      {"metal", kDLMetal},
-  };
 };
 
-MLC_INLINE const char *DLDeviceType2Str(DLDeviceType type) {
-  switch (type) {
-  case kDLCPU:
-    return "cpu";
-  case kDLCUDA:
-    return "cuda";
-  case kDLCUDAHost:
-    return "cuda_host";
-  case kDLOpenCL:
-    return "opencl";
-  case kDLVulkan:
-    return "vulkan";
-  case kDLMetal:
-    return "mps";
-  case kDLVPI:
-    return "vpi";
-  case kDLROCM:
-    return "rocm";
-  case kDLROCMHost:
-    return "rocm_host";
-  case kDLExtDev:
-    return "ext_dev";
-  case kDLCUDAManaged:
-    return "cuda_managed";
-  case kDLOneAPI:
-    return "oneapi";
-  case kDLWebGPU:
-    return "webgpu";
-  case kDLHexagon:
-    return "hexagon";
-  case kDLMAIA:
-    return "maia";
-  }
-  return "unknown";
-}
-
-inline DLDevice String2DLDevice(const std::string &source) {
+inline DLDevice DeviceFromStr(const std::string &source) {
   constexpr int64_t i32_max = 2147483647;
-  using Traits = TypeTraits<DLDevice>;
-  DLDeviceType device_type;
+  int32_t device_type;
   int64_t device_id = 0;
   try {
     if (size_t c_pos = source.rfind(':'); c_pos != std::string::npos) {
-      device_type = Traits::str2device_type.at(source.substr(0, c_pos));
+      device_type = ::mlc::Lib::DeviceTypeFromStr(source.substr(0, c_pos).c_str());
       device_id = StrToInt(source, c_pos + 1);
     } else {
-      device_type = Traits::str2device_type.at(source);
+      device_type = ::mlc::Lib::DeviceTypeFromStr(source.c_str());
+      device_id = 0;
     }
-    if (device_id < 0 || device_id > i32_max) {
-      throw std::runtime_error("Invalid device id");
+    if (device_type < 0 || device_id < 0 || device_id > i32_max) {
+      throw std::runtime_error(""); // Going to catch it below
     }
-    return DLDevice{device_type, static_cast<int32_t>(device_id)};
+    return DLDevice{static_cast<DLDeviceType>(device_type), static_cast<int32_t>(device_id)};
   } catch (...) {
   }
   MLC_THROW(ValueError) << "Cannot convert to `Device` from string: " << source;
 
@@ -1,18 +1,18 @@
 #ifndef MLC_BASE_TRAITS_DTYPE_H_
 #define MLC_BASE_TRAITS_DTYPE_H_
 
+#include "./lib.h"
 #include "./utils.h"
-#include <cstdlib>
-#include <unordered_map>
 
 namespace mlc {
 namespace base {
 
-inline const char *DLDataTypeCode2Str(int32_t type_code);
-inline DLDataType String2DLDataType(const std::string &source);
+inline DLDataType DataTypeFromStr(const char *source);
+
 inline bool DataTypeEqual(DLDataType a, DLDataType b) {
   return a.code == b.code && a.bits == b.bits && a.lanes == b.lanes;
 }
+inline const char *DataTypeCode2Str(int32_t type_code) { return ::mlc::Lib::DataTypeCodeToStr(type_code); } // forwards to Lib
 
 template <> struct TypeTraits<DLDataType> {
   static constexpr int32_t type_index = static_cast<int32_t>(MLCTypeIndex::kMLCDataType);
@@ -29,10 +29,10 @@ template <> struct TypeTraits<DLDataType> {
       return v->v.v_dtype;
     }
     if (ty == MLCTypeIndex::kMLCRawStr) {
-      return String2DLDataType(v->v.v_str);
+      return DataTypeFromStr(v->v.v_str);
     }
     if (ty == MLCTypeIndex::kMLCStr) {
-      return String2DLDataType(reinterpret_cast<const MLCStr *>(v->v.v_obj)->data);
+      return DataTypeFromStr(reinterpret_cast<const MLCStr *>(v->v.v_obj)->data);
     }
     throw TemporaryTypeError();
   }
@@ -50,107 +50,19 @@ template <> struct TypeTraits<DLDataType> {
       return "void";
     }
     std::ostringstream os;
-    os << DLDataTypeCode2Str(code);
-    if (code != kDLDataTypeFloat8E5M2 && code != kDLDataTypeFloat8E4M3FN) {
+    os << DataTypeCode2Str(code);
+    if (code < kMLCExtension_DLDataTypeCode_Begin) {
+      // for `code >= kMLCExtension_DLDataTypeCode_Begin`, the `bits` is already encoded in `code`
       os << bits;
     }
     if (lanes != 1) {
       os << "x" << lanes;
     }
     return os.str();
   }
-
-  static inline MLC_SYMBOL_HIDE std::unordered_map<std::string, DLDataType> preset = {
-      {"void", {kDLOpaqueHandle, 0, 0}},
-      {"bool", {kDLUInt, 1, 1}},
-      {"int4", {kDLInt, 4, 1}},
-      {"int8", {kDLInt, 8, 1}},
-      {"int16", {kDLInt, 16, 1}},
-      {"int32", {kDLInt, 32, 1}},
-      {"int64", {kDLInt, 64, 1}},
-      {"uint4", {kDLUInt, 4, 1}},
-      {"uint8", {kDLUInt, 8, 1}},
-      {"uint16", {kDLUInt, 16, 1}},
-      {"uint32", {kDLUInt, 32, 1}},
-      {"uint64", {kDLUInt, 64, 1}},
-      {"float8_e4m3fn", {kDLDataTypeFloat8E4M3FN, 8, 1}},
-      {"float8_e5m2", {kDLDataTypeFloat8E5M2, 8, 1}},
-      {"float16", {kDLFloat, 16, 1}},
-      {"float32", {kDLFloat, 32, 1}},
-      {"float64", {kDLFloat, 64, 1}},
-      {"bfloat16", {kDLBfloat, 16, 1}},
-  };
 };
 
-MLC_INLINE const char *DLDataTypeCode2Str(int32_t type_code) {
-  switch (type_code) {
-  case kDLInt:
-    return "int";
-  case kDLUInt:
-    return "uint";
-  case kDLFloat:
-    return "float";
-  case kDLOpaqueHandle:
-    return "ptr";
-  case kDLBfloat:
-    return "bfloat";
-  case kDLComplex:
-    return "complex";
-  case kDLBool:
-    return "bool";
-  case kDLDataTypeFloat8E4M3FN:
-    return "float8_e4m3fn";
-  case kDLDataTypeFloat8E5M2:
-    return "float8_e5m2";
-  }
-  return "unknown";
-}
-
-inline DLDataType String2DLDataType(const std::string &source) {
-  constexpr int64_t u16_max = 65535;
-  constexpr int64_t u8_max = 255;
-  using Traits = TypeTraits<DLDataType>;
-  if (auto it = Traits::preset.find(source); it != Traits::preset.end()) {
-    return it->second;
-  }
-  try {
-    int64_t dtype_lanes = 1;
-    std::string dtype_str;
-    if (size_t x_pos = source.rfind('x'); x_pos != std::string::npos) {
-      dtype_str = source.substr(0, x_pos);
-      dtype_lanes = StrToInt(source, x_pos + 1);
-      if (dtype_lanes < 0 || dtype_lanes > u16_max) {
-        throw std::runtime_error("Invalid DLDataType");
-      }
-    } else {
-      dtype_str = source;
-    }
-    if (dtype_str == "float8_e4m3fn") {
-      return {static_cast<uint8_t>(kDLDataTypeFloat8E4M3FN), 8, static_cast<uint16_t>(dtype_lanes)};
-    }
-    if (dtype_str == "float8_e5m2") {
-      return {static_cast<uint8_t>(kDLDataTypeFloat8E5M2), 8, static_cast<uint16_t>(dtype_lanes)};
-    }
-#define MLC_DTYPE_PARSE_(str, prefix, prefix_len, dtype_code)                                                          \
-  if (str.length() >= prefix_len && str.compare(0, prefix_len, prefix) == 0) {                                         \
-    int64_t dtype_bits = StrToInt(str, prefix_len);                                                                    \
-    if (dtype_bits < 0 || dtype_bits > u8_max) {                                                                       \
-      throw std::runtime_error("Invalid DLDataType");                                                                  \
-    }                                                                                                                  \
-    return {static_cast<uint8_t>(dtype_code), static_cast<uint8_t>(dtype_bits), static_cast<uint16_t>(dtype_lanes)};   \
-  }
-    MLC_DTYPE_PARSE_(dtype_str, "int", 3, kDLInt)
-    MLC_DTYPE_PARSE_(dtype_str, "uint", 4, kDLUInt)
-    MLC_DTYPE_PARSE_(dtype_str, "float", 5, kDLFloat)
-    MLC_DTYPE_PARSE_(dtype_str, "ptr", 3, kDLOpaqueHandle)
-    MLC_DTYPE_PARSE_(dtype_str, "bfloat", 6, kDLBfloat)
-    MLC_DTYPE_PARSE_(dtype_str, "complex", 7, kDLComplex)
-#undef MLC_DTYPE_PARSE_
-  } catch (...) {
-  }
-  MLC_THROW(ValueError) << "Cannot convert to `dtype` from string: " << source;
-  MLC_UNREACHABLE();
-}
+inline DLDataType DataTypeFromStr(const char *source) { return ::mlc::Lib::DataTypeFromStr(source); } // NOTE(review): the removed inline parser threw ValueError on bad input; confirm Lib::DataTypeFromStr does too
 
 } // namespace base
 } // namespace mlc
 
@@ -30,11 +30,30 @@
 extern "C" {
 #endif
 
-typedef enum {
-  // TODO: 1) add complete set of fp8 support; 2) allow more flexible dtype definition
-  kDLDataTypeFloat8E4M3FN = 7,
-  kDLDataTypeFloat8E5M2 = 8,
-} DLDataTypeCodeExtension;
+typedef enum { // extension DLDataType codes; ranged [0, 2 ** 8)
+  kMLCExtension_DLDataTypeCode_Begin = 7, // same value as kDLDataTypeFloat8Begin
+  // 8-bit floating point representations
+  kDLDataTypeFloat8Begin = 7, // same value as the first 8-bit code, kDLDataTypeFloat8E3M4
+  kDLDataTypeFloat8E3M4 = 7,
+  kDLDataTypeFloat8E4M3 = 8,
+  kDLDataTypeFloat8E4M3B11FNUZ = 9,
+  kDLDataTypeFloat8E4M3FN = 10,
+  kDLDataTypeFloat8E4M3FNUZ = 11,
+  kDLDataTypeFloat8E5M2 = 12,
+  kDLDataTypeFloat8E5M2FNUZ = 13,
+  kDLDataTypeFloat8E8M0FNU = 14,
+  kDLDataTypeFloat8End = 15, // one past the last 8-bit code (exclusive); same value as kDLDataTypeFloat4E2M1FN
+  // Microscaling (MX) sub-byte floating point representations
+  kDLDataTypeFloat4E2M1FN = 15, // higher 4 bits are unused
+  kDLDataTypeFloat6E2M3FN = 16, // higher 2 bits are unused
+  kDLDataTypeFloat6E3M2FN = 17, // higher 2 bits are unused
+  kMLCExtension_DLDataTypeCode_End = kDLDataTypeFloat6E3M2FN, // NOTE(review): 17 is the last code (inclusive), unlike kDLDataTypeFloat8End; confirm intended
+} MLCExtension_DLDataTypeCode;
+
+typedef enum { // extension DLDeviceType values; ranged [0, 2 ** 32)
+  kMLCExtension_DLDeviceType_Begin = 18,
+  kMLCExtension_DLDeviceType_End = kMLCExtension_DLDeviceType_Begin, // equals Begin: no extension device types are enumerated here
+} MLCExtension_DLDeviceType;
 
 #ifdef __cplusplus
 enum MLCTypeIndex : int32_t {