From b844ac0bc149aa08efca75758a4e3026a735d9b7 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 17 Oct 2025 16:19:47 +0000 Subject: [PATCH 01/48] add rocm support Signed-off-by: tjtanaa --- .gitignore | 8 +- fastsafetensors/common.py | 5 + fastsafetensors/copier/gds.py | 17 ++- fastsafetensors/cpp/cuda_compat.h | 33 +++++ fastsafetensors/cpp/ext.cpp | 3 +- fastsafetensors/cpp/ext.hpp | 6 + fastsafetensors/dlpack.py | 22 +++- setup.py | 199 +++++++++++++++++++++++++++++- tests/conftest.py | 13 ++ tests/platform_utils.py | 81 ++++++++++++ tests/test_fastsafetensors.py | 6 + 11 files changed, 381 insertions(+), 12 deletions(-) create mode 100644 fastsafetensors/cpp/cuda_compat.h create mode 100644 tests/platform_utils.py diff --git a/.gitignore b/.gitignore index acc54b9..cbe6914 100644 --- a/.gitignore +++ b/.gitignore @@ -9,4 +9,10 @@ htmlcov/ .vscode *.log *.pyc -examples/paddle_case/log \ No newline at end of file +*.so +examples/paddle_case/log + +# Auto-generated hipified files and directories (created during ROCm build) +fastsafetensors/cpp/hip/ +fastsafetensors/cpp/*.hip.* +fastsafetensors/cpp/hip_compat.h \ No newline at end of file diff --git a/fastsafetensors/common.py b/fastsafetensors/common.py index d369975..7dcd581 100644 --- a/fastsafetensors/common.py +++ b/fastsafetensors/common.py @@ -13,6 +13,11 @@ from .frameworks import FrameworkOpBase, TensorBase from .st_types import Device, DType +# Add compatibility alias for is_cuda_found -> is_hip_found +# This allows code written for CUDA to work transparently on both CUDA and ROCm +if not hasattr(fstcpp, 'is_cuda_found'): + fstcpp.is_cuda_found = fstcpp.is_hip_found + def get_device_numa_node(device: Optional[int]) -> Optional[int]: if device is None or not sys.platform.startswith("linux"): diff --git a/fastsafetensors/copier/gds.py b/fastsafetensors/copier/gds.py index 4dc1d7c..5f2ec3a 100644 --- a/fastsafetensors/copier/gds.py +++ b/fastsafetensors/copier/gds.py @@ -27,12 +27,17 @@ def __init__( self.fh: Optional[fstcpp.gds_file_handle] = None self.copy_reqs: Dict[int, int] = {} self.aligned_length = 0 - cudavers = list(map(int, framework.get_cuda_ver().split("."))) - # CUDA 12.2 (GDS version 1.7) introduces support for non O_DIRECT file descriptors - # Compatible with CUDA 11.x - self.o_direct = not ( - cudavers[0] > 12 or (cudavers[0] == 12 and cudavers[1] >= 2) - ) + cuda_ver = framework.get_cuda_ver() + if cuda_ver and cuda_ver != "None": + cudavers = list(map(int, cuda_ver.split("."))) + # CUDA 12.2 (GDS version 1.7) introduces support for non O_DIRECT file descriptors + # Compatible with CUDA 11.x + self.o_direct = not ( + cudavers[0] > 12 or (cudavers[0] == 12 and cudavers[1] >= 2) + ) + else: + # ROCm or non-CUDA platform, use O_DIRECT + self.o_direct = True def set_o_direct(self, enable: bool): self.o_direct = enable diff --git a/fastsafetensors/cpp/cuda_compat.h b/fastsafetensors/cpp/cuda_compat.h new file mode 100644 index 0000000..0c3cc69 --- /dev/null +++ b/fastsafetensors/cpp/cuda_compat.h @@ -0,0 +1,33 @@ +/* + * Copyright 2024 IBM Inc. 
All rights reserved + * SPDX-License-Identifier: Apache-2.0 + * + * CUDA/HIP compatibility layer for fastsafetensors + * Minimal compatibility header - only defines what hipify-perl doesn't handle + */ + +#pragma once + +// Platform detection - this gets hipified to check __HIP_PLATFORM_AMD__ +#ifdef __HIP_PLATFORM_AMD__ + #ifndef USE_ROCM + #define USE_ROCM + #endif + #include +#else + // For CUDA platform, or when CUDA headers aren't available, we define minimal types in ext.hpp +#endif + +// Runtime library name - hipify-perl doesn't change string literals +#ifdef USE_ROCM + #define GPU_RUNTIME_LIB "libamdhip64.so" +#else + #define GPU_RUNTIME_LIB "libcudart.so" +#endif + +// Custom function pointer names that hipify-perl doesn't recognize +// These are our own naming in ext_funcs struct, not standard CUDA API +#ifdef USE_ROCM + #define cudaDeviceMalloc hipDeviceMalloc + #define cudaDeviceFree hipDeviceFree +#endif diff --git a/fastsafetensors/cpp/ext.cpp b/fastsafetensors/cpp/ext.cpp index 4f08894..f48d937 100644 --- a/fastsafetensors/cpp/ext.cpp +++ b/fastsafetensors/cpp/ext.cpp @@ -10,6 +10,7 @@ #include #include +#include "cuda_compat.h" #include "ext.hpp" #define ALIGN 4096 @@ -89,7 +90,7 @@ template void mydlsym(T** h, void* lib, std::string const& name) { static void load_nvidia_functions() { cudaError_t (*cudaGetDeviceCount)(int*); const char* cufileLib = "libcufile.so.0"; - const char* cudartLib = "libcudart.so"; + const char* cudartLib = GPU_RUNTIME_LIB; const char* numaLib = "libnuma.so.1"; bool init_log = getenv(ENV_ENABLE_INIT_LOG); int mode = RTLD_LAZY | RTLD_GLOBAL | RTLD_NODELETE; diff --git a/fastsafetensors/cpp/ext.hpp b/fastsafetensors/cpp/ext.hpp index eafd24c..2f7c5d9 100644 --- a/fastsafetensors/cpp/ext.hpp +++ b/fastsafetensors/cpp/ext.hpp @@ -15,6 +15,8 @@ #include #include +#include "cuda_compat.h" + #define ENV_ENABLE_INIT_LOG "FASTSAFETENSORS_ENABLE_INIT_LOG" #ifndef __MOD_NAME__ @@ -33,8 +35,12 @@ typedef struct CUfileDescr_t { const void *fs_ops; /* CUfileFSOps_t */ } CUfileDescr_t; typedef struct CUfileError { CUfileOpError err; } CUfileError_t; + +// Only define minimal CUDA types if not using ROCm (where real headers are included) +#ifndef USE_ROCM typedef enum cudaError { cudaSuccess = 0, cudaErrorMemoryAllocation = 2 } cudaError_t; enum cudaMemcpyKind { cudaMemcpyHostToDevice=2, cudaMemcpyDefault = 4 }; +#endif typedef enum CUfileFeatureFlags { diff --git a/fastsafetensors/dlpack.py b/fastsafetensors/dlpack.py index 007487a..1d4338e 100644 --- a/fastsafetensors/dlpack.py +++ b/fastsafetensors/dlpack.py @@ -12,6 +12,23 @@ _c_str_dltensor = b"dltensor" +# Detect GPU type at module load time +def _detect_gpu_type(): + """Detect if we're running on ROCm or CUDA""" + try: + import torch + if torch.cuda.is_available(): + # Check if this is ROCm build + if hasattr(torch.version, 'hip') and torch.version.hip is not None: + return 10 # kDLROCM + except: + pass + return 2 # kDLCUDA + + +_GPU_DEVICE_TYPE = _detect_gpu_type() + + class DLDevice(ctypes.Structure): def __init__(self, dev: Device): self.device_type = self.DeviceToDL[dev.type] @@ -19,6 +36,7 @@ def __init__(self, dev: Device): kDLCPU = 1 kDLCUDA = 2 + kDLROCM = 10 _fields_ = [ ("device_type", ctypes.c_int), ("device_id", ctypes.c_int), @@ -26,8 +44,8 @@ def __init__(self, dev: Device): DeviceToDL = { DeviceType.CPU: kDLCPU, - DeviceType.CUDA: kDLCUDA, - DeviceType.GPU: kDLCUDA, + DeviceType.CUDA: _GPU_DEVICE_TYPE, + DeviceType.GPU: _GPU_DEVICE_TYPE, } diff --git a/setup.py b/setup.py index 
b052909..adecf4e 100644 --- a/setup.py +++ b/setup.py @@ -2,11 +2,132 @@ # SPDX-License-Identifier: Apache-2.0 import os +import re +import shutil +from pathlib import Path from setuptools import Extension, setup +from setuptools.command.build_ext import build_ext -def MyExtension(name, sources, mod_name, *args, **kwargs): +def detect_platform(): + """ + Detect if we're on NVIDIA CUDA or AMD ROCm platform. + + Returns: + tuple: (platform_type, rocm_version, rocm_path) + platform_type: 'cuda' or 'rocm' + rocm_version: ROCm version string (e.g., '7.0.1') or None + rocm_path: Path to ROCm installation or None + """ + # Check for ROCm installation + rocm_path = os.environ.get("ROCM_PATH") + if not rocm_path: + # Try common ROCm installation paths + for path in ["/opt/rocm", "/opt/rocm-*"]: + if "*" in path: + import glob + matches = sorted(glob.glob(path), reverse=True) + if matches: + rocm_path = matches[0] + break + elif os.path.exists(path): + rocm_path = path + break + + # Check if ROCm is available + if rocm_path and os.path.exists(rocm_path): + # Detect ROCm version + rocm_version = None + version_file = os.path.join(rocm_path, ".info", "version") + if os.path.exists(version_file): + with open(version_file, "r") as f: + rocm_version = f.read().strip() + else: + # Try to extract version from path + match = re.search(r'rocm[-/](\d+\.\d+(?:\.\d+)?)', rocm_path) + if match: + rocm_version = match.group(1) + + print(f"Detected ROCm platform at {rocm_path}") + if rocm_version: + print(f"ROCm version: {rocm_version}") + return ('rocm', rocm_version, rocm_path) + + # Check for CUDA + cuda_home = os.environ.get("CUDA_HOME") or os.environ.get("CUDA_PATH") + if not cuda_home: + # Try to find nvcc + nvcc_path = shutil.which("nvcc") + if nvcc_path: + cuda_home = os.path.dirname(os.path.dirname(nvcc_path)) + + if cuda_home and os.path.exists(cuda_home): + print(f"Detected CUDA platform at {cuda_home}") + return ('cuda', None, None) + + # Default to CUDA if nothing detected + print("No GPU platform detected, defaulting to CUDA") + return ('cuda', None, None) + + +def hipify_source_files(rocm_path): + """ + Automatically hipify CUDA source files to HIP using torch.utils.hipify. + The cuda_compat.h header handles what hipify doesn't convert. 
+ + Args: + rocm_path: Path to ROCm installation + + Returns: + list: Paths to hipified source files + """ + from torch.utils.hipify.hipify_python import hipify + + cpp_dir = Path("fastsafetensors/cpp").resolve() + + # Prepare source files for hipification + extra_files = [ + str(cpp_dir / "ext.cpp"), + str(cpp_dir / "ext.hpp"), + ] + + print(f"Hipifying files using torch.utils.hipify:") + for f in extra_files: + print(f" - {f}") + + # Use torch's hipify - similar to vLLM's approach + hipify_result = hipify( + project_directory=str(cpp_dir.parent), + output_directory=str(cpp_dir), + header_include_dirs=[], + includes=[f"{cpp_dir}/*"], + extra_files=extra_files, + show_detailed=False, + is_pytorch_extension=False, + hipify_extra_files_only=True, + ) + + hipified_files = [] + for source_path, result in hipify_result.items(): + if hasattr(result, 'hipified_path') and result.hipified_path: + print(f"Successfully hipified: {source_path} -> {result.hipified_path}") + hipified_files.append(result.hipified_path) + + # Copy cuda_compat.h to hip directory as hip_compat.h + # (hipify converts the include statement from cuda_compat.h to hip_compat.h) + hip_dir = cpp_dir / "hip" + if hip_dir.exists(): + cuda_compat = cpp_dir / "cuda_compat.h" + hip_compat = hip_dir / "hip_compat.h" + shutil.copy2(cuda_compat, hip_compat) + print(f"Copied {cuda_compat} -> {hip_compat}") + + return hipified_files + + + +def MyExtension(name, sources, mod_name, platform_type, rocm_path=None, *args, **kwargs): import pybind11 pybind11_path = os.path.dirname(pybind11.__file__) @@ -21,9 +142,78 @@ def MyExtension(name, sources, mod_name, *args, **kwargs): # https://pybind11.readthedocs.io/en/stable/faq.html#someclass-declared-with-greater-visibility-than-the-type-of-its-field-someclass-member-wattributes kwargs["extra_compile_args"] = ["-fvisibility=hidden", "-std=c++17"] + # Platform-specific configuration + if platform_type == 'rocm' and rocm_path: + # ROCm/HIP configuration + kwargs["define_macros"].append(("__HIP_PLATFORM_AMD__", "1")) + kwargs["libraries"].append("amdhip64") + kwargs["library_dirs"] = [f"{rocm_path}/lib"] + kwargs["include_dirs"].append(f"{rocm_path}/include") + kwargs["extra_compile_args"].append("-D__HIP_PLATFORM_AMD__") + kwargs["extra_link_args"] = [f"-L{rocm_path}/lib", "-lamdhip64"] + return Extension(name, sources, *args, **kwargs) +class CustomBuildExt(build_ext): + """Custom build_ext to handle automatic hipification for ROCm platforms""" + + def run(self): + # Detect platform + platform_type, rocm_version, rocm_path = detect_platform() + + # Store platform info + self.platform_type = platform_type + self.rocm_version = rocm_version + self.rocm_path = rocm_path + + # Configure build based on platform + if platform_type == 'rocm' and rocm_path: + print("=" * 60) + print("Building for AMD ROCm platform") + if rocm_version: + print(f"ROCm version: {rocm_version}") + print("=" * 60) + + # Hipify sources + hipify_source_files(rocm_path) + + # Update extension sources to use hipified files + for ext in self.extensions: + new_sources = [] + for src in ext.sources: + if 'fastsafetensors/cpp/ext.cpp' in src: + # torch.utils.hipify creates files in hip/ subdirectory + new_sources.append(src.replace('fastsafetensors/cpp/ext.cpp', 'fastsafetensors/cpp/hip/ext.cpp')) + else: + new_sources.append(src) + ext.sources = new_sources + + # Update include dirs to include hip/ subdirectory + ext.include_dirs.append("fastsafetensors/cpp/hip") + + # Update extension with ROCm-specific settings + 
ext.define_macros.append(("__HIP_PLATFORM_AMD__", "1")) + ext.define_macros.append(("USE_ROCM", "1")) + ext.libraries.append("amdhip64") + ext.library_dirs = [f"{rocm_path}/lib"] + ext.include_dirs.append(f"{rocm_path}/include") + ext.extra_compile_args.append("-D__HIP_PLATFORM_AMD__") + ext.extra_compile_args.append("-DUSE_ROCM") + ext.extra_link_args = [f"-L{rocm_path}/lib", "-lamdhip64"] + else: + print("=" * 60) + print("Building for NVIDIA CUDA platform") + print("=" * 60) + + # Continue with normal build + build_ext.run(self) + + +# Detect platform for package_data +platform_type, _, rocm_path_detected = detect_platform() +package_data_patterns = ["*.hpp", "*.h", "cpp.pyi"] + setup( packages=[ "fastsafetensors", @@ -32,13 +222,18 @@ def MyExtension(name, sources, mod_name, *args, **kwargs): "fastsafetensors.frameworks", ], include_package_data=True, - package_data={"fastsafetensors.cpp": ["*.hpp", "cpp.pyi"]}, + package_data={"fastsafetensors.cpp": package_data_patterns}, ext_modules=[ MyExtension( name=f"fastsafetensors.cpp", sources=["fastsafetensors/cpp/ext.cpp"], include_dirs=["fastsafetensors/cpp"], mod_name="cpp", + platform_type=platform_type, + rocm_path=rocm_path_detected, ) ], + cmdclass={ + 'build_ext': CustomBuildExt, + }, ) diff --git a/tests/conftest.py b/tests/conftest.py index 96d2f95..5960d3c 100644 --- a/tests/conftest.py +++ b/tests/conftest.py @@ -1,4 +1,5 @@ import os +import sys from typing import List import pytest @@ -9,7 +10,10 @@ from fastsafetensors.frameworks import FrameworkOpBase, get_framework_op from fastsafetensors.st_types import Device +# Add tests directory to path to import platform_utils TESTS_DIR = os.path.dirname(__file__) +sys.path.insert(0, TESTS_DIR) +from platform_utils import get_platform_info, is_rocm_platform REPO_ROOT = os.path.dirname(os.path.dirname(TESTS_DIR)) DATA_DIR = os.path.join(REPO_ROOT, ".testdata") TF_DIR = os.path.join(DATA_DIR, "transformers_cache") @@ -20,6 +24,15 @@ load_nvidia_functions() FRAMEWORK = get_framework_op(os.getenv("TEST_FASTSAFETENSORS_FRAMEWORK", "please set")) +# Print platform information at test startup +platform_info = get_platform_info() +print("\n" + "=" * 60) +print("Platform Detection:") +print("=" * 60) +for key, value in platform_info.items(): + print(f" {key}: {value}") +print("=" * 60 + "\n") + @pytest.fixture(scope="session", autouse=True) def framework() -> FrameworkOpBase: diff --git a/tests/platform_utils.py b/tests/platform_utils.py new file mode 100644 index 0000000..a7c8c31 --- /dev/null +++ b/tests/platform_utils.py @@ -0,0 +1,81 @@ +# Copyright 2024 IBM Inc. 
All rights reserved +# SPDX-License-Identifier: Apache-2.0 + +"""Utilities for platform detection and conditional test execution.""" + +import pytest + + +def is_rocm_platform(): + """Detect if running on ROCm/AMD platform.""" + try: + import torch + if torch.cuda.is_available(): + if hasattr(torch.version, 'hip') and torch.version.hip is not None: + return True + except: + pass + return False + + +def is_cuda_platform(): + """Detect if running on CUDA/NVIDIA platform.""" + return not is_rocm_platform() + + +# List of tests that are expected to fail on ROCm (based on TEST_RESULTS.md) +ROCM_EXPECTED_FAILURES = { + 'test_GdsFileCopier', # GDS not available on AMD +} + +# List of tests with memory leak detection issues on ROCm (non-critical) +ROCM_MEMORY_LEAK_TESTS = { + 'test_SafeTensorsFileLoader', + 'test_SafeTensorsFileLoaderNoGds', + 'test_fastsafe_open', + 'test_int8', + 'test_float8_e5m2', + 'test_float8_e4m3fn', + 'test_float8_e4m3fn_to_int8', + 'test_cpp_metrics', +} + + +def skip_if_rocm_expected_failure(test_name): + """Skip test if it's an expected failure on ROCm.""" + if is_rocm_platform() and test_name in ROCM_EXPECTED_FAILURES: + pytest.skip(f"Test '{test_name}' is expected to fail on ROCm (GDS not supported)") + + +def xfail_if_rocm_memory_leak(test_name): + """Mark test as expected to fail on ROCm due to memory leak detection issues.""" + if is_rocm_platform() and test_name in ROCM_MEMORY_LEAK_TESTS: + return pytest.mark.xfail( + reason=f"Test '{test_name}' has memory leak detection issues on ROCm (non-critical)", + strict=False + ) + return lambda func: func + + +def get_platform_info(): + """Get platform information for debugging.""" + info = { + 'is_rocm': is_rocm_platform(), + 'is_cuda': is_cuda_platform(), + } + + try: + import torch + if torch.cuda.is_available(): + info['torch_version'] = torch.__version__ + if is_rocm_platform(): + info['hip_version'] = torch.version.hip + info['rocm_version'] = torch.version.hip + else: + info['cuda_version'] = torch.version.cuda + info['device_count'] = torch.cuda.device_count() + info['device_name'] = torch.cuda.get_device_name(0) if torch.cuda.device_count() > 0 else None + except: + pass + + return info diff --git a/tests/test_fastsafetensors.py b/tests/test_fastsafetensors.py index dcbdccd..1606571 100644 --- a/tests/test_fastsafetensors.py +++ b/tests/test_fastsafetensors.py @@ -2,6 +2,7 @@ # SPDX-License-Identifier: Apache-2.0 import os +import sys from collections import OrderedDict from typing import Any, Dict, List, Tuple @@ -17,6 +18,10 @@ from fastsafetensors.frameworks import FrameworkOpBase from fastsafetensors.st_types import Device, DeviceType, DType +# Add tests directory to path to import platform_utils +sys.path.insert(0, os.path.dirname(__file__)) +from platform_utils import skip_if_rocm_expected_failure + def load_safetensors_file( filename: str, @@ -326,6 +331,7 @@ def test_NoGdsFileCopier(fstcpp_log, input_files, framework) -> None: def test_GdsFileCopier(fstcpp_log, input_files, framework) -> None: print("test_GdsFileCopier") + skip_if_rocm_expected_failure("test_GdsFileCopier") meta = SafeTensorsMetadata.from_file(input_files[0], framework) device, dev_is_gpu = get_and_check_device(framework) reader = fstcpp.gds_file_reader(4, dev_is_gpu) From 73b2674c43d4dd5663310682fd0f4d40e73ea5e6 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Sun, 19 Oct 2025 05:55:20 +0000 Subject: [PATCH 02/48] add rocm documentation Signed-off-by: tjtanaa --- README.md | 16 ++++++++-- docs/amd-perf.md | 43 +++++++++++++++++++++++++++ 
docs/images/fastsafetensors-rocm.png | Bin 0 -> 54504 bytes
 3 files changed, 57 insertions(+), 2 deletions(-)
 create mode 100644 docs/amd-perf.md
 create mode 100644 docs/images/fastsafetensors-rocm.png

diff --git a/README.md b/README.md
index bcacbce..c692e10 100644
--- a/README.md
+++ b/README.md
@@ -48,8 +48,9 @@ Please refer to [Foundation Model Stack Community Code of Conduct](https://githu
 Takeshi Yoshimura, Tatsuhiro Chiba, Manish Sethi, Daniel Waddington, Swaminathan Sundararaman. (2025) Speeding up Model Loading with fastsafetensors [arXiv:2505.23072](https://arxiv.org/abs/2505.23072) and IEEE CLOUD 2025.
 
+## For NVIDIA
 
-## Install from PyPI
+### Install from PyPI
 
 See https://pypi.org/project/fastsafetensors/
 
@@ -57,8 +58,19 @@ See https://pypi.org/project/fastsafetensors/
 pip install fastsafetensors
 ```
 
-## Install from source
+### Install from source
 
 ```bash
 pip install .
 ```
+
+## For ROCm
+
+### Install from source
+
+On ROCm, there is no GDS equivalent, so fastsafetensors supports only the `nogds=True` mode.
+An example of the performance gain can be found in [amd-perf.md](./docs/amd-perf.md).
+
+```bash
+python3 setup.py develop
+```
diff --git a/docs/amd-perf.md b/docs/amd-perf.md
new file mode 100644
index 0000000..433ff59
--- /dev/null
+++ b/docs/amd-perf.md
@@ -0,0 +1,43 @@
+# Performance of safetensors on AMD GPUs
+
+## DeepSeek-R1 vLLM Model Weight Loading Speed
+
+This benchmark compares the performance of `safetensors` vs `fastsafetensors` when loading model weights on AMD GPUs.
+
+NOTE: `fastsafetensors` does not support the GDS feature on ROCm, as there is no GDS alternative on ROCm.
+
+### Benchmark Methodology
+
+1. **Clear system cache** to ensure consistent starting conditions:
+   ```bash
+   sudo sh -c 'sync && echo 3 > /proc/sys/vm/drop_caches'
+   ```
+
+2. **Launch vLLM** with either `--load-format safetensors` or `--load-format fastsafetensors`:
+
+   ```bash
+   MODEL=EmbeddedLLM/deepseek-r1-FP8-Dynamic
+
+   VLLM_USE_V1=1 \
+   VLLM_ROCM_USE_AITER=1 \
+   vllm serve $MODEL \
+   --tensor-parallel-size 8 \
+   --disable-log-requests \
+   --compilation-config '{"cudagraph_mode": "FULL_AND_PIECEWISE"}' \
+   --trust-remote-code \
+   --load-format fastsafetensors \
+   --block-size 1
+   ```
+
+### Results
+
+The experiments are carried out on MI300X.
+
+**Cache Scenarios:**
+- **No cache**: Model weights are loaded after clearing the system cache (cold start).
+- **Cached**: Model weights are loaded immediately after a previous load. The weights are cached in the filesystem and RAM (warm start).
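+
+As a rough illustration of the `nogds=True` path these runs exercise, the sketch below loads a single safetensors file directly with `SafeTensorsFileLoader`. It is only a sketch: the checkpoint path and tensor key are placeholders, and the loader calls (`SingleGroup()`, `add_filenames`, `copy_files_to_device`, `get_tensor`) are assumed to follow the upstream fastsafetensors examples rather than anything introduced by this patch.
+
+```python
+# Minimal sketch (assumed API): load one file in nogds mode on a ROCm GPU.
+import torch
+from fastsafetensors import SafeTensorsFileLoader, SingleGroup
+
+device = torch.device("cuda:0")  # ROCm GPUs are exposed through torch.cuda on AMD builds
+loader = SafeTensorsFileLoader(SingleGroup(), device, nogds=True)  # GDS is unavailable on ROCm
+loader.add_filenames({0: ["/path/to/model.safetensors"]})  # placeholder path; maps rank -> files
+fb = loader.copy_files_to_device()
+tensor = fb.get_tensor("model.embed_tokens.weight")  # placeholder tensor key
+print(tensor.shape, tensor.dtype)
+loader.close()
+```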
+ +FastSafeTensors on ROCm + + + diff --git a/docs/images/fastsafetensors-rocm.png b/docs/images/fastsafetensors-rocm.png new file mode 100644 index 0000000000000000000000000000000000000000..526b695e16aa4716a590668d9f9b08e34d1c43c8 GIT binary patch literal 54504 zcmeFZcT`l_*DZ><)mGbpn2@#wl^`@IA|PPa0?9e6hzLl|83WplC|VLEo5&f-xwQo) zN|uZw6d44H9Nydt{k6aGy)o_|_l&65j)7r?Ed#@{Uw>MO-}tRu zTj-k@AL2gBeVFUlYnGO#7D7BcM*qBk+r(UthlOpg6+UFO>3LNP28Ion$p1?s#KQF% z7^)R1r%x!@2KF`E*={-Wx!|jf`KhI=Z#+DH@_hPX z)p~{gh7`tMe);w8n@^4xLPT?7vQ|Cynw@C(o{gY9 z-nZuGpDpb~R&Cg=QQN$Xfg#^z!pmwELz|0ixKvQGI z=Fzf5fBp5iVw8gH<9(9VFV1aPxBHmNrAwE56Yj2f??qJ4u=OSbAOy>cH`qsCN8$$%p%*@M)>)_ou4 z*4f;cxuUDf&dDheE*(<)*R56bk#e!#*7>=#V7t!k&E~}i?P)9ouIbSwR@RV)!M^K-h*{FF+3gw1PBhK@4adz15q zeQhf)u3DbW;JQgQ&pBrxdqk?^%NH*zWy{enSvFSIbgnGiH~-a=ZHf^xC#VXsYAH!w zJBktm19z4B9Xc1S6k9nnIZ~5p)tfX>IiH%?9B{Q2{u2m!ap{{B%nmaQ_V zPtxuA@a&YT%{jxmI4e8nQvSNGAe$C5ty8yd-Yj~q4&NAZ#maF%%D(i*EjznUm~F~1 zKBsfjfKsfQV!6n8U_**w_``?41c^GSIgAg~OwoH&Oh278YR*ilo}$_;Ph=&#ZP1jS z7}{SFC@A0E-ECaFYW=RRt?pYao4)3?-xp|+!LE1*2gkj9$x5u-etve`s_VlZJ-=J4 zHuQ7`nAGAao+LfXeesT}8JX`DPBrYISO0iE5YLdVv7N!SL&&=C8f(U}HN9WnKkj_9LF};SvEe_uKRmk? zsT?1?dfhsHQBlz_^Nymh6Sr1g&39eWNp|&pX=!O%aFDQ#|D(O<{INIwcv{++Rc|dn zv#|AHPm!@Fe*A_$f-oH3f+zY_VHtG6yuzm^ZUy$=c5};!2@rL%zcD=yBMHzce2{Ul zHO(YsvQTX9(#j3HudAgQ8yVEa8F45^U2$}Dyx`5Dc%j(mVCkt1B3Ei-)oH2yNxH>r zn#Z#%D=SO>{&TbB_&~Gd>C?Brj*J|_Yx$Hl%-pt%I;Phr>YTeVZSm~+?r|8b-#Hei z>f~z`uN5NY-cC$S`6nd&UKJ_7|Inq^%V~*UN7Xuv^sw>!`1xy&&5l-unY9<}`}NoS z<*QZ&aBF5haa+sO*?9NwzfX@;%S-zmF=}`cr5L?KTU&ecmMvG{ofopK`%CtE9=j|$ zH=$$k<=sZlM!l<7{iQ`G{~qmctUG<~T)-Mejwi0J44WAlb>a8AbM$x@ztK@k&qjM8 zS1M^4@OnK#9thA%faH_W=fq0A^LDXAn`zpA8EptbLMd0k!I>C>m5TrKtY zgQ5Db-n{QgX@Edh%J|Gkc~-L3rJOULx;1cj{^}W6S3jvBp$zZ-*1SCRdRSzZm)+bX zP14>z)2=_I?!vvT2QSFTJRCW?Q|E%XxVs;pu6xG(+_Yq4s*z-nkktiK(}b^Izw-X| z*I!}Sz^g-Te|6qvaeikbHtZnMSsr4NY1w`G=B-1*Emu z7k^vm7?q0Kw{Jf&ZqD=@%$sk~5k@TOtdbVv*D3Je)y%ZyUAN=#?=?}1hhSp+4jg#* zcR_)_sMFLFPtmD&SFT)1H`4xSG5vbvVBWZr^K5{iMcDS=FSGp^1Z_ak(|~C%)(b;K40X@8XFti1?8!RiYEd|P{S5pOKstP^-*P!mO-q$)yo??~UP^3G{Lb*~ZH$&8GQt8+7xonwtA z0>o`koH$WXUS3YDt2aKc<1|MS#~3x zC+Bb0!)q-*|Ghd*D0gO9qMb%lju86X-hQ9=?FL)qR?XU+*|EmA_NDuz0#zbXnb+Ul ze(0)4aq8Q3woF_q7o!lPFWT|&@QkG8&Bn@1%Y1APe)QSNpMS)uG)yX}N2wh9cmc+~mY(SZKQeAKY0YguY}_>Qys-d=OYg1AG8*ho zCvYL`q}v+q;vIztwQO@4kF+%>>p#}7j;J`(8+6p{@?R!vHmun^v_t1Y zZ*6RIL-Ed=UZZN>;|-RD%r;MUnq*hBPp2ou)7_Q~hURXywRd81p15T3mQmUEdK!%9 zD&Eu?9^%Xg)bUki9|uQ~&V&NBJZxlmr8KjU8* zSjBko?h_Sli4~FdT*cz};mXykTBEj1^kbY-`2hg|hQ>Mc+LK0A371ZJPOoE7+S9he zRn9bWsTQRZ4rN|1x_9rJ+js74wV$T0%*F-HRcSPu-pX}5u87XhSiG_sY*~74yLLo^ z%jpmojfukZW=mU4@@8vo9UPeKvtHlMb`u$}X)-(atT7f*X|lstTO)OR%aG8n2TOZb zuUW$v85zkhXuHhTgszt^EG;Z7G^(GJ(VLn0>SjD> zzS{OaZ>OJLuo+smk&^Fn@>Rj(55UDiDjan3doi%yTiUb^2Qy+GZVbfu1*BOT*&98&q} zTkDoe#}B@3$%B<2LLBByC=nTNY9DLx{_?6jJNvJyw^JN;qIy_qhqQTx(!oapZBBzZ zL!f&8CD=Q}L^AqhTofQ45eVey!Q|ZcG&nz_hyf7<* zri#@@RNi90bEy_XXld?a(WS1XM|VANWB~v+XRph)vk*bH_7^Y-hF^zjW?AdQUj1P$ zNUSBxgTr7>c-BCs1Ymuc z`Rw#~9bP?(K$S&zdh5>E0BkbC>pWvi%S3WY_bM$ZsRovK*=UldN$;tVzjiIceylH2 zpw+P|G{kOlaxzlFm)rmMOE+^TJ9oyar%5@C^;LvP28@0!Wa)M1j5B4QFW6~v)J4?g zR45~-QhLoaxzwm86@fJR(wjROCCp8L@ufk+%0TZjj*i&_IpbQs_F9f#&-AzC2)E8L z)gsp()+zXzW^wn;Gu(>;LAGTCJZka0XPdKZ>f9MQlbvVn zo9%mJxqGF9ghD4rXu=^Z!qyiW(@bnc$H&L(@Rk&##v{0dI>NC(Km@sNO^j+)Yz|7P zuAxtFxQhq!=AC0z5>Fb|##BVezR;*eMb!Q5?(WPk=PP=8y*<(KwKrF+O*X9KKB%3m zf!Oen72h<4_A%QuJwt>yEDsi$!t?T@4iOnCIb={3R;tS%Z-rW{$p`gCM!r$ft5=E{ z=DLzkem?;yQbks7AZw80x8F`uzx4OV0<`ydD{EB%$fsN_-9c_wJ@tA;U;Qg9pqk9; zaZi_-Q+|GaD^m46WPxuGyQAP}ityRg;we-DFc)d}KmPa-C}@!ks}LFcsKc!*6@09F 
zSX4OPd3I`th<$QriQkJ5=P8P?%|JEWir#F~s{i5X32t5GIE_fG@X?SEF`K=6_i7g1 z-z8Yt(ZpTkSXZ!Z9kY;vzP>(pah7HGb1X2b2hDE}Yt^HWf^6}DzEw#{$%mNUI>h%5 z`-2qNhjq)Aq~tio`uh4|I=u#vI3A@HvEnJf{u*GGlX)$`uigqr;I1CL292q)K0MlS zzMHvAQll|9H+wneY_7PMcn@7ZM3L z&#lWn6Zr5Y@aMYie1FHf5VHqhNpToAHu{)wf~;1fGxJf?{Qje(ef9EdnYgQAVDxrR zu}mi)&uzRX3q4u#x^h*XB|p&Af@4P^_=R2Ydrq*3wiDfZ2fx7=xvTIG|3i9GH|Sd| z=gwDJl#9@;*SDY=R7<+@=Mm$k2wyFGim2#(4x<$A7P~A8{3t;M=x>U*`v2p9+MT7TDK7V#w_ zRKiy)IsS}bIiOr9K%(8TyCcrEfi6ZPb6S--4mPByYRGX&gFS_rXP-UxP%)qeo=O{EU;T6&$?gD*Gj};tRyY2q~wCdSf8q| z?is(V%56Fib_vRLJ>qb7cJBOhfAG+R)z^FV372lEJK52;m6#YeWQ$II+3d@Qdc703 zZ`?5~wQA_2jwj>C!q*;c2u9JxQ=i`4&GN3#vWZt0f$?*iiou5Z`CRm`UJV1lHDf7{L`mf~^W6FAf61&LA353V6$SUq5`=j=| zO-3b#7rO1`iOp29%RDkW5;D&vH!qUYqHA?QO;CPw6PWNeOehEB^;7}f4|ZC-N(8#@_?Xy>BtG(@t%r+y1SxDw2m2} z)A|4W^H1aWdQF?=4!Jn(JZJ9S*rVkhUuU+5gxuY2|1Px2EzgtI(LKJ2A)&J4Q1%Lj zHZLEaFi=t5cXk@fT)!T3^XAPj9UW|U-|S&wVM&wK!{?QS1RU1?yla+?g1Sr&w+3QG zB?tAGTCQV;g#!vr6#8Bf@ruz(HU9jDqxs7=ylZXE%TGe6v!A8c5z@o6ck`xAqX=)& zr|zzgl6`T9Lm{GVS4Us>KtI!fjqDd@GqZ`IODk5c%)B2X>QXp8;yl$IemTWP3pS)4 zG?+c|Ks^f{YtcA%*{Ic~)oFNS#6onOPFDnrpjo7GlrNm{RVaQ&CSg6*01SwJa^!u^ z6Q5SmB8~x7FO;>N6iFRm zJENHb#XcDa9f0CSM7Y5KhBmNtH$~*2&QAA; z;*2#^w6#q~n9AKWo)HtbB6zf`;uMmajcECFi}%YV%T}g4N(Hf)+3k@Y)Q%Plz&0PY z9lGeN3%~5_muMM}iI0!hvi-EelPf9uF}zOh}a5-t0~R`DNX;;lv?0OOvLbgis&;w9b~Ja;YQ z_b%TrV+~S31t5Vf=e{P|ja*HOTn6M92d6tf-fRr6*lznfa> zb-%$(kW@WLtjZ@(-h62hPum~j_*pItwapIj3BgWds=njOs>7qsYuB#jG!3|^wThya zaPfw5-mJB6e6m)_+cMv_wu`=ok66=O4+;sX0eEv4bB~EOB23$lc0Fr#o-R$w^-*XU zzXZ4_5_~GO^poj_Cawm`YGs#7PUl0I`*Hu$i9v#H>0D;5!Z1@L*sb(teD zg*6URptH`vQpF`DOKlpF8TA3=%V>wLmV9{kXs;Er6M#Z_Xdn1Y&0ybJUY`3picPt@ z17nU z`Q*tHM;6-r`QoCYZ`=LSRN0(m&r$o)YX{X+F91p?gNJJ>qIGt1h>B`0Tlw>c+p9Ob z=gHfF4!YKse}j<0$!6_mL&L%hKu5a&`KKAX@8ieqGrB5N=UKY4$js22GjnW>Rqx(a zTH*x~4O+4dabVmVlV;|Qip0Cjg`MUD1yXvox4*LiMIPh_I)ma)a8_g3kV*mEn)Qi)o=H14Y!O)&(rBC|38JNp22ZPM z$#I|qkP+UstOIG(Jb;#(&TU=76RxA{A!~1MpWDmx)~<7KFrFY$lsj?(M~sf$Dcvs} zTn!6;ZWxyl_AbPYL1v2wD%#?A0DtsC7MFCc-o~_exKvz3!~xnLkHDm;oqMp0Js}Qk zprFZs7dj)j|Nf>7d2Pq9ZpHW6Ni4m;gFi~aSe$X&wg_}kI6=nsb3SCcBM%^Ho$=>G zUtix~$6*S6pjjQ}^*AjpZPTVr)v@XV5>wvep05h-@9af6l+$I+Hv8r&9E)U*jQW~a z<)Xbuh6^6IwY62JfDCa+f*z{ZfGsS!YpN zOm)5RJZ%2u-O^r8BY@O8Py%g9C7(>wgErVM3IO7b;jEpO@MblcOphnhGjf(g4^z>|W zvDUnxuNfV)MzCmD&6HiEr#$TD7bn6>M{nLQwZ&kI3F_+iWlnvRe}fGj&7YZ;q}UzgEGDI89++-NFaV7Sq!2vT3K03zdD|Hi4&Prgh7VNaseuW4HgO8NS^VK@)q@W7GQwRU&H~(^8_v%%H!Im8H z^XEU5i_OQpf4pD#+?nvOupab_YC)eDrx!BJDf1G?-W!}7HWu$PD*BZi2 z54LO@==}2K02|v|T~!4IFLVqdR_(UUXG?xuHv7m7O$nNXw6-wUwbO-df88QAsIS<~ zk>SIYL$5c!up7?;dptGWIv)qpJOW%W@%HIkVXS4VT4}@z!JfXexs7C=k^;KyUdyxT z%h@?OHP241^3`3tl}pCf);8DZ?wva@E5+UCF8eC9#NWDe_ik^4VSLTQJ*N)qmF@DC z5!}DO&`x=%H!iCzHV!?Yc$wm3M(Qf>-@oU65d|3ZlruhC4pl%6{(ZjZ)SYy%ydh8Z z?xtPYOl36X>V(*c2P|T7sQWYTzZ^)FoTK)ImQ zHx>J(+y4j}2hG6G2GtRd&;TH{Dd-2y#7+ zib{1iB|79>jxe$gIvhE4NS*|!!lZ(2G#6{iz~GCC30qxV-HvHdg0fH`O^7iK?FMaO zWN-^@AA?V?-MEVzlJ({Lj*ymNnm)s^716;yc0&7y=T;4&rqG<)`O7a);fl>h!otiW z*-nxY5>=pO*3NXQ12y3pohv5$?!7pWw~9s7@uTkTypWI(|HJyvwQ}sc!7Wv6mOl1L zPIPdPjo~8O*`cNRx_?(?2TC9NdV9Bh*Ph9#DFYColPwAz*$50A930|6hVp5~&6XYB z%2DV_43Cd1qnCg}@N;UZ+umP~(JxiLq}YS34C?spx8DNy4x+dC0{s4Y6hS1pfLw`( z2XnHro+fb(k3IVN9#3X96CMLg-Pza~pEnnU=oblJCw)ltTf;%1Go`nlsYo-?CN3&2 zCFNr|;Q1-QIFs_?oTn11Zp9pXE70xYpk8D_ppZ8qD;c7{vztccaz}lrBH_bjCfb^$ zdr!!+>nV~0p=M-|zpVg~Nq-YO=B=&V8WCs{HQUjG*bM3(1I9$4E!0!-;;vfqwP%2{ zk)Sr=4o?VEm=-V@G#`bQf3k6A_dX|tnKCQFGyw%#BG44q)hPqDS+2Dr{jYQU8vwF2GYCX8hOE_zjjth?)9Pk=?f#T?tqUV!*y`C=z25$Vx z7+ACg(QH$S_qd~=+2`BAKzHkQ9hE_1SIf3dL|FIUlyZqty6!QPmhFl5g8TB=ycDF} 
zoQco(+}0SrdHp(BuY5OcB*TJ6I*QgU9{Uma+ev*e+wzSx6^2i-0bi68B(dDJtfh%SQP^X}CrHE1ti6AOD`7j9)gro!C z;~f|n10T*PEjF@&JJh0Bu0fbYgG-y3Xk*iaoyif^Epu~oJJ5J&v7<55lDs*Uqd>jv z;JtkN28LoQw2#i4 z+ifWTCcmJf@}x19NfbtO0mX`jkI4MYNSP4mD%G|zI~GuymffeMq{_}rC%`cDChx4< zxiwOR(is^ZY_4yC=V59NLjkd3?9DbE5Lq@Ae6)iq3HgM)j%=N*vC_KaIh}uF*}ZCG z#NT@vZDF)=;OH0g+5 zrP?EHPxO{Eyxu$H{NDL_@D&)ptsj+5Oia=YrCNkMGA6#}nFhShPD{OB|JnLr=^(G! z=f532&p8k8uKJwY3PxMAZyRIS{AAAl;?HU_ALlgtcBOwzsg5cSdmVVr&2C-p^nh@C zd%Ju@ogJDh+>Q7->x}&d#?EcF)U@@|)AsBSf_Mkw9pL;tndR_(es~Z!eG7d?(0()m zeJtl^+IrgBtxH|JfF_ur+SkkR|!z7b+MSd>^6xdkx(XkbI>!vn76q4(`;HMQe)#?Vk>-6UIuJ=zA2nn=2{6f3g~Wt&^p8AoZw^)K_J<^zf@nQ3 zs=U^)CQ6r*^_CHygPvD<$zA1eDP}3OLDMwZuTa}hTrXV^EXLO zAmtZo=16RyPmSu1Z*jnPI^`*A(dSo@zY^w|0K7l`_~SQ|>9$)N46p!h!LO1LI*sMm zeQd5#*6tshE_Caui;qW`@wJ_!efS_llptniW=sdw0pm+U#9EE~Z?0_yd$^mn{K5VE z2Zt=mqzbcPqC}RnW#>+HRI_t)yU#VK?E$;LL1gq{2OZuYwBztKe77{;?%M|V!F~0C z#O&!c$|;VM<|sa*z-ROzPh&yC5s|M=41Jn3W&sAq(vvz0x9M#?*b@8Z?uK5Vso~*a zIS>w(=#6y|79-)(n`3jI#ZdO3p{I#zIylw1ISQEXi?BckQW-p8A1R0k+DDti8^{~J z&LJQ`$|E`Cr|MKAb@E)9o&JW$YDa)*BFUzMj7mXu3nUN;NJ!Eo*|8&Z_yQ@1qBsDvSnhr9LG?8*wUCjCNjc&n z*S>vcN&BLhCocw%+>6SXE!Z#>=G2hultq|-MJX9mt%l_^*99j;qqQaif)`;4)dP zeHcvuCy02a&>^&(nK0X~LlPX;_tUIa-fYs4~C(wD~m_S>T=OIbNX}_ z8cvqeo>^FEjZrc8e#;WjPSHpnBr{>n;z^=s7IjnsnHUAki@0C&{LEUb?#eR)&6e_! z&5lY`bkif?F5Qo%MJvGmSt40`c907E<3|;w25}J8ikB}xU(X^M0}qHm2b^HoZ^|~f z;_mP^1_n;S3(hWy(BMIEc#0%&w64B5wm_ys$avklJq!%u8|4p^zvJtFKznHRnE(50 z84}omR=Lxw&E2mweC!+?*wf`6_S8kjwg_0t z#t#HFr52Zz$c3w~?EMmXh{_6r)k$o6nPU9bp2VOP_gt#`CR_DwUJn+P6v>%}ibw6< z8dX5=?ef`~6*bAYE=V`PDmye^RP5_JnPw+L9!h0Zd~WFEJs%2n_l{%7H*DDcWYC(a zHtSlagL{muCbe28e^%(BqY8D)ZY9OFVlK+ipY2X-OtAHtnVofSlK#FqUb~lSwJjAC z%n-l4tqLVl8r=RCw)6p3!R8{wPk0@ZWf*HRHF5p%Ir}tWZ&5Vb+I6uQOub70;&Ym+<_` zo-Cdamzne@Yb4%rs7=J2t0uGw0GuvAvyvirnr`48p(UxFI#^w+ZNvHXqWg1$+rq^I z&GX@WhhDJ;t$ny^U01(cos-RYUHzzs*`%CYkHXTw;#ryiK~RAdBMG(TtK)GS)56w@|i zS6UD|b$QN4T-5UK&|Ee_EVXD z&A5Zr*1nk`-ydy)2cdX!2n1C3A-$mTDyhKg9=ezWHR`US;t1ysj_3CL{DvCZ)MVjH zdCraV;jgmeJw4~Qy=A1b)=?5bDSY3WvZ=8 zkgveY%=7z|OnJe4j1#FaN zp=9rNF`M(fSc25KO!dl)oe9Kl^m1YYw4bdA$$r7&>|W;?U1vCw$}BD^+^r$jJu6)u zeNIm?ZcA6~erW-owb5#Cdo*p#=9|-craQhi1SMz}E5&kFAJMH?aFD=L`D@?N_Zik{ z)LbC85@i+O9sDR#H@ddBHqWx|dFXtQj!i*cUWJE?OS@9JO|eqO@@%R?hTPMsmTE~S zlb*1qCXHB)G*wTL@yyCYeB{keF090(n|nC!1^Dtuu|z*Gi%mJ^d`ooViqx~zPx}nN zuZ8Yi_8qSG&I{Yg-SymEHFYpgBe`!*Y(rOF^J-eEu$i3Ld{VJ)4tU%+!$$GM3fVGU z-^O*N19>zhO66FPLvi~4@1K*t4ZBBuz${%A7MsVhf4?%GLt*AlNKo%(gPLmGvEZ$b zsj>di7So0rsjbO$Wv8_3-Y+c#E*n-pjjNOjtkm2vuc&-P|7jd^LzHvSHB$aIhZ!|w z*o3gYFE3YK*Hd8ISH+Vx#?djf(N|aT)F}nws4(?<{+%vLXRn4e4p(ewlAmDuBo=qQ z^0<*Yf1Uq*G3{*Ajnk{Y-=86JH&rRF`K7m^K*m9nrl${tQnS=?RexG3_Z8v}n7 zQ?#>yc6>lw-hkYo)-#Rf=aD4z95I?rfpGuZbGj})>cJZpBYcSo8dq^~ak(p3UT)gF zxj0k!`!X;T2^uGnffVv}3h-v_)D?-%++#C*JmqgA&?qImMU7c(lDa}AamldKd8Pu!g zGHV6#pSnL3zqN6i(a^!r(XxfyzKjn{A(1K_b{M-(q)K3+Wk6;WUtWYQ`I~@SZoD4; z`c)R%@V$e?&4vvSpp6_hZ95Jbls;-(e_owC&_(}7A@V86 zQDPuZhybJDYpK1kLHTP^SKE&F)xQ8r=fErn>ReKgGBPvAg4$vi6jTMJYT>gEBPl4d zwy?0olZgaWY5@1<>_o+T=G-}yKccO!0(s|5-Zu z;yu?iR8WMeBXtuHch6fUZ3T!6i13MR|9%PTYX~q>S8v#06DI){6=X2V$l-(S@6k1i zLKm>Y$j;a}j+8L3a~9w=gI!?8(}e3Ahgu*hDGQ0u9u_B^Us9mp4bM=i`l@B&eybpL z4lLh^H9$}HU2(AlDo&mh>xChsr@!M9IvF=@dX5s}8rl=23}^S5H}#=VD6-H& zum(xwA3Ai%+uy&3&s~6xEi~V<3F9{?_RDDN@4lI|pxlvMz>}_w*Zt&zLHR-^L!=KV zVHh`Ve8wi>bF?nxsM$$Uo@i(UvO>G91PaEA{S`E7vykMKfpYuybx|O7+h0)JsetL1 zAdiEE9|f63^aE+F&RI|v5h;$IJn9bu!;tCE2b=CIxHm!t-^g}Xn%i*YV5tNneyftAPdxqEmh zpuASKS@rz|#|8C@1#K5cyf8xZ{p%vUX7OA3|Eb>+)US~%S5W9}#pGHnH}P>IX<#9? 
zvHn-BX7qncF|z#s=hT4zw+R2gyZQe;6I0LK<^&ny7t^D_3rKsV~b{QJo;(U%35}z#lv;l zE}DceB~n)80FK{(mw}2$2C}hNC0!LSQZD|rv@}>mz1WwBG~=q%Oj;#!7O~gG?TyQ` zA!M$^tY9SOgvgwx8Mi>eHPQlwYN0yI#zYfMIYQoAVXzd!9BC?121d$<8@#@~x~DSq z9vJ6P^pfWcQx8flAh_%=KFFI6%HulYv{JO5 z!_V~iEJ>lT54{D{2rTf}-tO3vZl(j}@^LLKtthRW%rg$QlR|wRn%}N`siSS-(qpFe ztFl4S)}YO-;R6x$X?%Vq*v&`~&j+9iAr0b{nUIxyK;Me~;nW5S6}!U*B_`=lU;!Vq zk^usjnXh+0fBrmd)cBvsr14Js=QFOu5gLK>-!>tCEBCZ(8dOyV5NZ@B0gS>hYcd?G zBV_HNI8@AYc6wV-&;xg;?T5~inPX71XFaw(OHV%vrT&=Q z;HHJmRr#E>!FFvsM8_X6Wo!kOnKW!6sI4QzGo5{y0(zdEon0NTEe1hd1fYliF+20^ zV>=e!FJ5rTgIBkCb=Dv5?pR7zfaZpG-B*fHd4|p=A-<_wwr&k09S4{yQP_j_iZxhV-lCLEtFp83)8f#P-@%f64iMBvnrZuSCF z^UqxKXrFaMQlxbC>ect-i}<|g+2vK)CcrvJ&WGI zXEz>MxU|dwql5b$(l@}YZ53LAqjh<6^yi=ASOMInU1oc=Q*?{B9@NZK5NI+zWfri2 zD_zawKkl{7o15z0#NPzX6dL%Er^)FCEdZ=x9_g8&kKXfz!V5^9LLx>!dvC0%#F zgEkH)DyJn&mOxx23zcW?#OJjXXow58F+(p25kguNW#JMB>bTb0rd_Z94Wlyv*b-Dc z>OKm}ybA5PVJ6TO@3y@_)u2+ty6^@sL!TAdsF|p&v|U+wGsE{-BQX<3CXNO&XuBzu zn1#Be_|F5xscs!2We9c4wrvL}4X^Y(Q8%F0+eeAQJT)su?4m8vhB^UPfc*a%L{6=VhD3vg$c+6LHAt6y;LI!x2ic*-B zK>p+(A9K~Z9juU63(lhijm5_7)$t%tizi2Y*YL0V7)gwJjxl^gSPH3?kvEC{iZpwv zFY#V7FtP>}DI{(G@(TXDf?`cunF!&JA$90IICyyzW3uFX{(I2BHvHPciZW=Z!9hM@ zmW12-#dwp2bYj|~0|d(Vx!PdV*!<|Ow+%l3^a8}ok^*8Vm2Op&THEG2({?SIizC|_ zTao4v=xyI^Yfl}RF<mE;D9i4rzO*ePy1D3z1U&c$e|ec@kxl6Ap(U zqNkImPIYv2grY-FSQMfjg&Kwps(}Ca;IdwfoKKApnpmYQ?#D5%oqsLjr1WGi=Dz~` z{37i}ItdUFa-K;?*PyxR=&to>Qr8syYSUNvHQ7A^{I5-3Tv9{tQSAqTe&tVvfDEFF-BYc8_Vlmb!LzKNZqya-Ny8nJ` zpJb_kBa&!bm)PX+o+S-zNF-wZE6?)dQ6OA7>XO@^+Bk~Y`D>t5rXWqT?2Szms&m32 z7C%_1{Nd}(nTqT0o+3(nNNO}|n?XtmK?{c*B8=lUYX0q+*Ow1M+`>vhK%=M6%?v|} zq4r~x$B6*cm(XB(_LlR+18n_A@Wp7|cAaF~ub0W`9ZI%3iigTr6Cp~xV^a~-Bf ztMQs2yg|@*5Ey}^P3mF8S}wSGu}+5YV0P7i+!;tq5^}feuu?$hwP!=gDg^~@(vJZh zN}*(oB@wg=bZguTxfdB;D==dIzJUx+ZMg!TpP+Im#YCX0=)pN6AE4|Z$N@Tt9)H6) zSqKEYB^ONnc!r*SzJnGSHG!gfhvH&ycJ2*K9UefWAgqy4+efLs3bSZN#Y5D#6giw$ zVO683tomyb#VvklEhiOo;QzEdCUfP-F)UfIXD>7sEh@kFL!zbxa(v zM#8s;znYca&w=h2huUC~G1>XUGP(*Nzf++D=`eEw9m|RXN>2S?3QOXB>oTIC%I-Fs zg^+?ZXlLo-g$@Y9th&0cZPy`WZ>&~MgKjes%cDGbhd~VjC;pX@`}P?^nNx`b?B(qp zihrU2m)-B*uYow2>^;1+_>*Y_rrUqK{vc$nQCM>h9D;)Z4YhRBXBI&u_M)W1`0NjO zLbBomrqRhrCh}bH&f(!o3<1>OS3f?pGL`Hv6pTGS>c+Al3!#f<1Wv`B5Ha))zAJxt zm;SSrSL?T|qoFQPB12U*HH&a?IKguHpc^u}x0lyToG9e2v=|0u;#7AJVVpr8N**PE z+2=1_5M*kI=tlIDD24KkWbz2afkVj7Eq6GAT|+M-Ab$4{#D|3oke zpZjf^SO$nxB`LJm&1)exQimSOi}j#Z_Q!v(Iaiw#CPG*#@MK~*jZ>(}Fz1N^S^Y-` zg}&f14ta`AYl(818woM)#SAVR1>AkYkA6~BS;dDvk=y-ffe~>Sib>Jc&(#_hFExY9qt0A*0`qvW>{6r?m z0V{I&4jtmR?2;ky6Ad3r&IO>%05d#0)PhVv&WiHjrLtoD4~JOEg~12NAkvS)2BAM0 zWJ9yd{49}0@fJ)D!AzXSo5PVcRcjX0ftQ1iWW}!(AYX#pw4CUQL<@wm0Wy{jrT7b+ zf}&EtWg$A?)hn}UikKKe$mY5qwV3hdFTr+*{u;TIOaO<5hf7dV2p+!j?iWmIYd|SP zq((6Yi)pq<1kXZdv0SDbTM^|60K|M^7cf&DVAXFFBuPSHV0IC9@k8o6a?=J052`ZA z21$M<2?>>|gb>q!xEyqBE%v?t325**@DqcI=WeV-l}9ZrEfj|M-p$R8LWO`y=f|xj zvrW`3%*+QVxU?^8H++YTs$1e*rt?AqJUok$@(Z#gnhR_cs6DAKAyp)94GX5e{P5v} z#X5V{+J995%~uYBp~oR&)fhCdc}dy)jctKWK+Jr6Mq%B;XSz}ouOIE_uhRg~MktCT zJU==#*gz!+npr7`n~zyh<8RFvK+&j7C?^i(xEM4GIJvo{Fk@{QCs5FpK?{}#7oqU% zUCNUl3+@z;oa4t5==y^_pPSsh61fl-6SUzW4G6^K{z!{0Zj%k zjLKH#tysJD8pg25cCO!b^eN(x+N+U;XO>yHtJ86Z;SJPGUAH!f5~_?S>M^$S9*q+M z1TbU5Mj^h-;dhpn9+u*h8lTLea=0fnNas}Q}re<3A zM9yIyz^hS%*xTZwIyZ7(Eof$ASst@VCJ}PmH5hwv@2I@k8xWK0wqV6QsHV$FZ zC<4=X9^=$!)+{2>HuKB+`Re|NRbgOc;4>JTI*+`dh*_;g9l(dga1|ctug!1w@NX)klbLbG+ zLu`8ZYRQw6-X97=g|#2Fw%<#0#wy&CIFWU`qY>(=ap3lM58v|+3x|4XOW zw|

(fM!QpC7t;<3`y&qkAH&;-L;e`;Rz1%7Wu{8WxhzQXBF3gft|m4o8_3y=T|@ z<0G1~HL>c-INa)GPi<^8;xst}uZ)g3p@6pCC^>=whhQjT62l5oM_<`&(ocgE9)?!d z)94HHU-;N>9385pDb#`PH73G>Go2~A%`4iHwv2s@TI>}~u*mJ(Ya41Ia0uhkRMLTc z_wGEIm4IgueIbmAjY6ip$dCbuO?I3Ev)yBd4k{k^W^42=`S|#t5RU%ikDtKW{k?rC z_STzS6;D;pb|KGNy80}mR5SbpDy{v%r1aWY2WHl@It z+(L%68va5leZqT6Y;NKO0jbC(@O5!gixLquN<5M2zE{LCFe$gUyGgQ+8y;-^TxjHK2((t&joC*B^2?yx#Q>fU$SmS?aK{ixNV30{qwjojHu7xVv-c~q4jNad< z40uk^b3>|;q3%D0AGhj}GjA|!1m_XZOE>f|i|eh4_C>tW^{9Z5;6ExMqH|_v@74&_ zimS1AaEL}|L0ZKO&wl_<==9kr#KGVL-Kn`4mim^?{sTIZ+ym%DdJ}MlG&*7l^(Db~ zKadCGGs!=-HT%qBB0tw-o&(X?Z4m<5>h`- zFk{unMGbJMi^U{jmKA2ide9`GzJwXH{P=2;zEHCq=x(}S4J^spjV^ly7K)8>FvLObB9yJV2)_rb|^YtK*lYB}`t z6Keb$D`UU-*t@|6p$A6}U-H872sp&7L2wlzwTj;q7AC3gS$N%3(6C1Q1*iq_-_el8 zTNn2XeWSnHYB9o9CUUg}LDi$ExbPc>HGg57a4L|J;^M{~SYG^Js;u;6cafXpNNzr? znojf@a@yyJ-K8dsd%QK;x^U?s79CtM6Y2G9-k~+~Vz& zJF>V<^Ht)Ok5jU599*&xA{jJ<@EH~s7Hb_B(fI*QwjF;>qkl%BlJty>DIv5777qk& zD*daG5cL>fes#4pDN1bNTCOKEUka!$KE2A_f5_MC|I%bfofc3PHbI4mUWvl9Vll9{ zN{1Hz|i<3WfhUhJ2modVFJAqOmDn{l8Qq;w66!= zbjV@l$vf`b(UQAyIBwUT!G{MHw#U^xpX!>n{FdvDc|olkH42d1T2!h+v4+6^YY+_Cbp+M zJF;)R2o%$sOI6#yHFvbt>XxXtiHatLs_gcQZ$F3C?(Uy$%I7lA@6VkLczJJT|GhWr zjOt^)E-&JSSKoj1CjRDy0{xC)(Wn?N&7ujT6h7-&nbDx{CVkv5iM1_OF4Ucz$9hK5 zHFkxD*^8OpRA1fJ={I*gFtC(WYcW?@S2F2zG~JWwYjo0#k5`1 znuVgb8VD^C&D379F7sWu0ZzBM9K8gK z>&@q)&0{zD?vvGkLV4-Y(B$|KU-MU*Jwt2aWW6-MuX(=i^V3UA(7Q*vxOpq%+2*1& z*D!(NJgKbt3#CKu7i#P88MkZlD=ALpun!jTU%3#+XFVU$w|6yJhPgzu;rK=^=ZaV> z$FlRfY(}%?XLGr&@PJ{-lhP8@vg^Sw5~e$gJ~dq{uzW$W*5_L?kQ37<W<+I5?ceO#AXsgw-1YQ#{#h%d!*6zMe z!6NY{jfm2lCbmi~-sSfLC0plWr5wlIEi}CwTYR)F4Fw&SZK?iri8;j1m}BK*v&zs1 zC1L`CE=Tkpa87rLPM$q1R2SQJo|cIfQ64IF5f*4Q4*lIuxo4ua-`v9TY88_Zy8>W z`AO^P?F&*ql{P%|^fI2P&}(i&S9d-dR^xE94%3s$0>I-14jn^`+g3p7b?$C z?FwQ!K&#%U%QhR+B!A8;z)UT-ruY5$&5FM=y2H8bL>59%H;#d4^A7ryU7@O_xH5Zh z-u&|H`g7wMUc!@acCP6bkkxW#>@c-ue|kwd@{+P|zlGGU>PW`HOfKP9bBD-|g3+O+ zX1TsEQ)qbY+iV=zxp@S{ZepU1JihLUlWono;b`$QCjxHy5fq;8{*f)!G)`3K%8 z14o9~_ppPnlg6dwLCk5^l97GZ4vLW7@Jm*9G@PhgaOn2G zKKU!?SF|GaaT~xTUgS7V9NRz!A3=KndziIc>z{e||4{eVaana;yXZ|xmwR)SpzvNl`)DnJzgji~@yQUF33AD;Bu$nYIUg2o1eh;+a} zdiBreyZEt@1`^^6)M6(RAD9FHp;B{d=wk*cPA|{uqj?yH+L4vHboh!Gl)- z*aaimD^~;P(6@%Tx7Qc=XQXK;K`ai05uqv;&=eG^i=J!pCz3ud0=I=qF@!5Z%h|bq zf>m5lay_;5xJUqskUsz~3h=|f{p+WI_<|a!DM0(z6#;+4}|y(W|HJ%Sopu>*FrR+|G|2C z_0;=R7!2I`N*e+~&QF$?2~Wc4iQt zmyS^110QKfbzuvy8p+OzQQGOv)^~rL6^)j?qHg( zALsu4H-ZCruJC(6@r+3Vik)=Z{{H)>j0I-20*12x=?n9U{YeMr2Opo{q6=L8P$(vZ zI-#I?hTr#`PXu%$@DAav3p9rg;NbzB{;!Ac(?ikz{oOQ#l<_`e3czx*XBR)5{P8Ty zg#hIQu(AdT)Ehzh8i4LJ=YIO;{BUKm+BOR+cnXyeX~T!6EkFvUyyWKh9c3+`yd?k+ z)$*qBI+rwDov1_c7ic%Wtuw&HhCx*oN&*6+2}1xW0g6Z+i>JRga|l_EuL7HfF_4}L zPX}3|i^g33D^>zMjg~*p3+(#dKGmZ~&%+z8f0}}h{OWwD=ou)6JW5KKOwEQ?T%g$< zRQ?nYe7*pMU}J!KG8%k%;sWSFifQ8L(4#0oPsdO)pQ}b!dRCSxP#J(Sdw`?|l#mBX zC%DxDzhB0R3pjanRMdz^(6crGo;ji*!7^H#V541Z5&_b9bpi>I%jsc~1 zD3S5=j<}c@=wF9&W?o21(GT#C3w51U0Swsc70Tb!I7RP-{FP(SlVJ)iE&+H=vdR_8 zhJ=cuP+HJ|PYDOj7qlDGWte~&3v%CtQs^-T&^j3SD5y3LD19gbIYh}g(8}?co16P@ zT{QO%7XXw)Is36YnQ}m2zcK3%Z*xBU;E?uO6cuoVpJbM&d@Fq;LJvyMJmBQ{HqEu0jdCNHQ;}NKJ?>9j~>mjIRC-t`A!zV zE=4(s$-`XDbqjzilKjS)tu_EX7S~n18;F%d8EOE!Vh4~Bh$hqk77t})fwHZEIU2A8 zAmcm+>PQTEtOCFb|JUZ5J0*SUX?o78z3+Z|XC zNI6rW<#vs?{0lFClW)7hK?G3ptx??Hskfb+48l4!_5_QA0L-B1Ey zWKxo*PW9(Ib)a%K29&^m0KOztX0(^f7I3DO0KEDCioP$=^ZZxt?MF`4-^<0bI|*!? 
zfHR(CX$1zPsJKOC=CQ-8eQV4XJ z0oN@X!>9>W-r|nQN>4Z57|h6(P4$K@Q9yzE7fA+)35Gq=bloYp7-9x05E4)!hj2>C zAK=)Ge~=sy>iGHBGLO*F&?13t*q)ygeul=B06$LT`Um?3csz9Us7HXLEDW4P?+R4Q zsp01)9dLir;dVeV zdItztYJ*lgmbR)$a4r()hKv2%cdi0TFi_co(##TV4|+j$2DJE%g2FVV1PJV*-B_UV z`1F5yiZ(83pGQzm1C$yJD(Ch<`UeyZ`V1`oz;}Y3fM~Xw1;lYOX8y!9k&@9p&91XR zkR5anXhT~TfE7SH)_`X$1cejTng3MlO+mFDScf8D5`z{&ZD@BKz}-PSJ1|{sJ5p_H z1U*QpYxTFGKw->zO%UWko%G7;s*6Snpxy%(m&Vpu;lKE=bD+o$zNHHw_n^Z89N3Zv z&cDEhs>6f2Z=@aLvOCbA`8(AU;F=XSD=#GE!D1{2nk1n1&NT)Nm;qUN04N&vYW$)3 z>RL%;$6Oq_oZH3(l$fz8c)u0a!!h(^#kr$2$n-!CA5 z4h$Bw{&brf0k*?Gn6ZS-JW$adz=HrZmH{Z25_&uUc$+qS33+g`ia0osK) zmUaQF!gk_ZM$X1!-o))x_4XV{pc{os|gbM9IS#%)z zQvMH^yAq!PQ}_r05z%zHBkTblpvS1@PxdE*%2!(Caze$~y_fNalJd#w1)H}cklIr| z{u4dQiUOW4D0Ubt{Rwm+Vv37@vJ2A`J$Y;y}ALgYZ_4f~c*ZO1Atc&`k!{eQ4X|Cq?2HG9ziG*EwHVpWzbX zr*@!>EbkPx#{}90%c=c*TwiPJmAS3h8td6-L#uQjSk8$C2(blk_My;0pW#C|+koU4!{{>t&Tg7WAIB4EMLh}FKl%<+vt zWdA(NP=W49`M5vJo5a*954P^|$CX#G!3;6x=5=cn^c54sM0f8R)Gb)T_7m zq8h_@zQ1%6f%B5MpZcP4Y_!asJK9+|%AJ;$BinyBaQ8EZ5~1s~;arZ-gR)(Fg9IXp z!6kIdAqKe}N{Lt16D|S^gzhmVLIhlKCQ2DzZEV|xCfCiqJ2B~IgQZhhrmx=z9GbUw zFJx#$s4rhZlT6P+VdzLP(!Ddn*lIY&iA+w|&~SKka|EobC|a5qkf5 zo3GF!;e1KSkN$f`Ra1F}iP3g0A~Ku}3gPa-H%PjkI1Q`)&zNG2F1 zYVsU7?U5~WT!h%m7sf3NmJ?0aO6OwMpNq$f4>xA8Io!_H3v?JTTUGf^Jl7Xn5^I}1 zO3hQ+GcD@eF$T+q)sX^8?#egQM^TscZuYKr_dnVjt{6&&U)J@yJ9oBstBZ@jqIwoE z_;G7!E+*TfU<+5XxMrmGc421RE-DS>8vjZ~%9Nn+bc2A3b+ecLZ=X+WYj{W-Ka4rt zqjt+ni=(!ak#ZbC%HAyQjaJ%}2#+S3%%79VGT!TaG=dqV7%GEMU+UNZTX)6w<7TRM zZ$CSz0)77UWSc5s7Vfd&dVNg4D;_*u5SarOJf4tfJk33<1F>Sbpav#4lt5e|*>uNr zUoBX#A6gZAZXWO$`4Z1zkrOCS_iAjaje5T)u8HFJ^7HWEjAVK50wFnYWiMKxYXLdY zTt)90x8kaAPEwafPe!$-e9FgS^kuu1oT^-mcpuCv<+^gL(Y~#&As#7*!6z9&Pr$*% zn^;@VZm3F3`QZ3E1`g6<@8y(tjq^0x873hDBZ;jg<|meaH!cE&EqS`@2WlXJoltP-7>){*%(JVCn^Cm|ZaqO|9aplg%v?;iw@gyAr(aL2d>%)w`x8BK=V|=et4%oFYQEK)&R- zj{;ZB!JE?Js>ql?N15wDBuy-;VG{rIES1Fqy*XX6i^_$((K(;FJK#aEu?LbC9@K$E zL^0><3Z+CLqF;qif^aa^EW2FmLwJbQ(5{Qf1u+i9k}KGwE`Oz6@jDd0)EnpEob(vd>ZVwbklqdK~lvTKOv=v({L$j3!o z8(1c;%Iy`AY5R(s{rz;gu)CqZO!Lx84F!yu60JR7>%ps|gZ1?}Bz{^xTox|ytedXl z^T*tnOK}gbc5`q1j8udQ2N!ZWwB%peYmymqKJX(lWZgRhr=f11FnUStTh1YmoV zZ3MRyurYiZ)N~=8%wSu4ooe1MP}XC<<<`GkP0`JR$R@t#*=Eo{g)QfdC9I>p`NmB8 z>4&Ab`(c*sTs-OW3SGEJ!!BuhvJZctn8RoXXO)UTSCIVeuz;^@D9GU(cuO$^5^vy| zEgFnhanNNl?o~DLI~f?^DQon~v@I$$>aJuo78mv4`)*t&5#Iw37S()ftV;L<5FX#s zRvJzR-GJ|6cNs;Oxhp7%zn!k#G-Y?p;uDR+u*8{$u;ygaOYxmBWD=`+Tk2`qIy?n) zqjYENc4ko0R5n5lI{l=_lZanbcQCIB7Y=gspi$KHU0Uy8nK=8teqN3rBfSgj+1Q5q z@S*FHnFBB58Wj%@5tvq5ALLtyz|3%I@^H-LYv=Y;qX3(+dU|y`0NE{kXFil&q{IVd`ZA)Ovj-$3@ly; zhv$x8Uso=c+BQj$e-;eoLoim^s+Lm3J?M8|ph9(`jSf{geNL1K4%DV_#+XO4&bZ#eEibV}li z*QX2D=jT3+FYltWbnK>$jDaOeD?kNZsoBCxwx{jku@d9aKQJ905w{!Ym2~HK(!tHA z4lWKn&>Ub$e@wyWokR>?qk@VwEW8#@WNIO55)Evjyt(twM zSGz{WD1hveac}1e&|VzUNf05t*aL7bQ5cd;<}KjCfn)8b8CE5!L;yxbZ+tSyS0f2V zik9Kmv`T-%ln4Ae*#cCe+3`r;-1Ny)hXVK%{Pq6P+pd4l0v1z+gf zJJ#nC5YM;d=JO8jcM88*AV9KL5G=8yYyhX3zQvzj@6Ox6DR12o9&(NQs^q6okK!1T zkbk>4v8zLOg?c`zY(gL&RHRz7<85aSK?DP4};|7>ljhA;tJum{Rl)K>II zupHFHU(>liHi_gQ$TClq75y;=KV|%YBe%g zfKA#143r$SD@#im(u1I@pzu=>kgpvK(&}P_&Qn$eyca%S{`W6ZcampDb zL(3aQ&a(Y7AJv+ot1^lFJ>&`|g^h5jzn5xT)za36~~Er3#7 z34X;4z((%hjfr_wPl7v%VS&OP?=&Wg{t*k(wD7^UNINCRwKZgT={bi1EQAEf95X}1 zdg_0;cdfWsg4t7aNNkn_e~4-H$b5^*8qgf(|h>@1>fZ-ho8pfVyHA8Yv|M+QUVv7RLY@>OSlBUt;WXCGIX~!d6jqlQt zAvaU!3~a{*uk@$P-`(hJR7*b%BM5NI!v^aD#$q;mjX30bWb%`qY?}NxE0OG8Om$Ze zUm2M%ZJ!lPg9@@#-V}Q@89_YH>J)#B|8Pm==JvaTO(L|8Hwl~e`QkaxEY83cljv4} z=FI(jv?;dkNg9x|<4Fr%#R8m{YhRayEnq#ptwk7Z6T3@k8+2^hGo-wPbay1{PQu?e z0dtrz!L7jn^F8BwJM&5~0fW7Z)taQ>+d{iawv~yxs{-k5wQ}y( 
zA)jxYZGQh5gjPEJ)v%50kt2+b`{gVJPF>!jgHBhfB~jO457%?fwRyV}JQ@QVJ2Vr; z)PvcVAYh1i6=Th^#qyeUY5&bsOwv76Y$XhlJo~S!=|0R;1!vpSh0tGqy>qnu0tkQ( z1qb0qV57BhpY<5iwq9Z4y*rDitL6a_G;OSr?ZO2?0a7_%o}PM_oD;3R@j9N;TTXH4 zLidGkEuSwmD!53OPTl=A@?cQnh%m(*#HDmZjB#l-IwhOGZLv1I_#95xKUjzne?B5w z^B7T}-JGeo=OkV4IfvnEa594M+DTS&Timu2TH!#w)G5xVgBI^mCOq1Y`$*whh41Io z*Du@hE}m2mr1=>pFa%y92sUq*-QPqLMZKA1R+SFymTc)wUkcSM)SlxZ>gIVFHu=p^ zvn?^L`~3%r0$IG8w^^UWof<0iC^W4T3ZFCWJw*T!P67_bVmqoj3&fWNW z3VYzH@Qcw?ep7xDs4qRpm+Yum6?&*bKFEiEB{HdFrHUBvGp}&h*AoKaRV~? z`{J#Y(W($upI)+ABlz8d4MjWo27L*WK{(wNYc^M)PNxUD|Ju;rdf#1JIwo_GpeHyG z=89c7r{djDJeyh3M)+^n*$5!}bMHN(W9Oxx80ucmiUAM2FKaTulb>O?E4oTqS9O5{ zLdEQ*SHuigrZLUEO(O!gGVCz4UEiC`kh z=It#}kvlkbqP{=1u$>w^OEYqLI9!U#hK1k!Bc{sO4FK+V7o9N{>YY zsm}^Wu=k}-wT&_FeSHyY7L8JE;hAthId6!RL$}=&v7sp>eF^lMav?i8thp_#p|2B; zqV!yuL~Yq)W~H>Ui#+i3epQO;-~N1U^xK|wcAi3wkb}EsC+n+&v(@i+zOGPl4G++= zuRNGb!dhJ25-g}3S|kI53_N$hZFIbAyJqu6qELXZTFu41C)B^NH~*QLAyI?H4Xr-Q zt7`2FKW?}%gWguhwYTk6^*7Clt1?SIOE)4lT!=~D4;HSX`=XtFl1W)Ld(J66uSrJ$~GY>W=b&cOA!_BxHq^cdJxt8vey4ihfvpN^S z_;=hH2YOZt*?ZZApE+LD7UxVPM@BqnHvrBDp2Iib1uA46XY%e=p=DhK<69sb^o@r51E%HbIC0B6<5Loha;8Y78)b`< zpOiV`Az~}>&zfMq;j>bSG4Bj$HuSHYZ2cY0-g@1cHIP14g(g5g={)u!v~W*yb%!eq z(kY93V%V1j_TEpSow_&|%#_cGZH8>P~b*WZ{tDpoTHASdA71YFZidog#Z1Lx_m-Q2Vwhi3Gxks(F zJ*@}-;Y%sXZ`Y>Um)$vxuVhMtVVj*anL2wKCv*3olvA_IVs`hX#MatEMbd^ z!cR*YkSh$#Ec`Oy>7tI_GcF56c=)$9`_v{*xZg#u_Pz;ZaMuf~zbK?8y;Pe-Gkf!$ z&=^PdK18P|zKCIi2J-X~LE%c4?$XE=#8aGKZjegHLARX{v7x0RJ#AlU>p(hSOjd-{ zn`ug>DPn4EQObcAm@cN|YbpuJ$J4<(@1BLZyVo!LoW*ux=51TJtWGo?*D^nao24FcA6{;}aos^pMeAIn|~!Dvd%2#mKYR@W2jZ?pG^P*(()ZxsaF9)!uvzX#$h5)Ewyj)dZ~BXM=qrg@cP*7=5q`Ax zxVP;XP8uq#y@m zELo8Epo||*fFJyIg>}D% z&g<{1L+lAOu>E~4fBu6TKsO{Cxfe!=g17&)EH(4i1AXjp$U@!dm*rPVUGX<=>6uA# z(-If%9Wa`#i|o?0g>Or9`DHoOc}#KV)%1$;?OAP9?X5npicO#)zNtJ?H{Mh)?WmZ# zd(#ZupcMrx#<}vtAGE}<({*xvJVaM{?#dQYzdh-V_7>zy)_}B47i_a36F*`_A!RWWsM6UW%s<9)dN$8VnX+#x7H9 zq>tmrYa{}F*)F`I@q%xoGs$*nAgn!j^{r|z)?VsswY;wt5K0~i zu3L2)&qcfjK-lZal@MP4{t-qTapm4+Id; ze+PSzAGArW_603koBu7;dk+H%HSW;yj#=l&ONj|$S8-U}`+IR#~zBD#90>bYv5YHcdm>xsxgZI0SN+l9ow8K3mI z3KFJ@KVcv0Yma6S_j%S1qJt-gx~{(6#E&3hxN1>LtJW^4ZOBq5ekl-O>JN^g1o1jP z(JYMmT?{w~H2!vsV71Ic`snNT%vIMUS3adDJL=F{lZ8?cLhtB#Eb zJh-^mY*Lz9?*WH~@@7w7Vvsiv`$j*xy=7eKX{gJC()eJzoUiv(cuoA4kAV@$(kLk|wLdXqS_i!)`7%2ZpRvT<>mn^Av-yF`%S* zftb1S8>`r;K&*?n+UJF~o5H^WN5$&zTs1@_C=9D??hmwR9gPBPpOGM$euUe|da}0s zQ5CNe2lH9fHJs?@smD_hu(uv;z9+4Ol~3hPFAq8EeI~k>i9fal#i82mo7N*r8jX1PlB1HcLYwajP2J zFZdVw4IN75kQ_1XXe2q;bXrHQoE*m7zVn^T*#sAt`CEEmra8Q&DQLWq)nB6+BcY-g zyAP~x=#|R8@i8M~!gPIVh9xoEX-M1X)?6YPEhb~w{1rF|@ClF+_VxD{ri#!7>?Vvg zKP)FugvY*n7q&q8J*dvk1JV|T{Ri=fK;#Y%9HR`*#nS=&*5@x?)C4#R-Fn}sndV{E zr%CPz5Uc`B5!0I*$}$=&V20g&mR=yZwqz&KTHR^@p{f&2`QSlh+s9_xw+UwAOFnPT9i3O?>2ns`~%fA7{X~8a3tAh-r|?& z%M*003_J>65H#s{Vc|40@B=& zygGnRr&?`82_)^90Ue4LocuWs*bu4Lw~IF0v74; zMuAyT&B9I98S`k7>H)*HSiTgBF%wT=ssQQnCvW$RRA=A3$cYK48rk7sQ}>WOJn8%T z&@b8s;>myOM$!(%*fPh5C}s&Mcx=e7fPr}m%nFIXMT5fD&}L`{7Tv_ zD$^`~w*X*mv3B#4M9=A-fA9Ny7_3)>XSSNHP!*M<8T1%cJ4riW=1p-&#WHz+4`RKy znvSSGQ@|68XI)P&!|af#OPL<_B%=FCg)o~#Nb>Lbyd^Kl$grVzpljf5#Au`@_Utqi zM@^Z87N0KJwdA$c!!dLx4=B&7Hr^XAsT6ip@kXkR`w<(~j*w$~=2^MR>IAwn--8oR z5y8=GkL_L}d4cx+c_69L0(yl#fqt_dsNGjN?8LJTanjMD&bb|-ulA*U1SdD9f+p`X zaQtx*Xp;uUm?fKXYjujp>2W2{JQ0Fm*?{O*S-5Yi_CE{O-+EL=fU1r9BA^A-7U{VT z77N?QUx=l}?e)ajIp{J~KJBJZTnlha_~MbPcaizN092)HDi?x!CdWQprM23CWM2*A=;TVfSU^B`|E3 zYe3`Yxs;SB&_zgR0X$+LUUUa^TDJk7cMxDfwY)BVI-H|k$p}QXi-C$pnfcTxK`Jy7 z0~MT-!$A(!ZDmLk+``Vn7kZb>@ns)v$pkNkU}res4Jle4Vktb}Q_kKs%6cmXEEck_ zv2z`Gf)>#`;YVyqbcQk&9@3&x(9TJ$C4%mb)LBo^|2?I3Hg6cX5vxGORc& 
zs7b^sC`lo*b3CvBSpe!$F}CP8^{PeJ`!#3v>v*Gg9mw~$znp^`i=-4OXRqPGB*_Oa z5yXJhBzw3b)p1y}J;tJ|4Y(1%F2ZwBA@>9Viv=*C=A=+k>t!G0IZ)}YAYZqhno57 ztNgexao(5RuS4uVp)UmBR){Axg^OU}pzcP7^izPwQzZ~Q@O#j`R6#Zp>4(r$Me=k; zoiPQf1O^X*M?m0;L_|Q4SOY}DROP&dogGcHq|dQZRN%jjvr!qxZGg52yUSQV#{W#A z^sey+*r?J6>G6Zc_Z~ngK-}T+_1vZU?0qENfEkNtpV|mzM%U%CH$j-04!`%wWCtW) z6vqh`UCj$WZ2RfT&q`+CMQae7Eh-q7yjtBMNf%a4|=c8OY0eo_wfC;;rq_%z=IY@*6!IibT za|HkHJ-9e2|7R_=^9k=knWT|=H|B1gC8yKif=IoEP)`xLHK{{pvZrU0k_fHah|7kE z;PEj!^M5OAtW`ZRI5;&3&}=)6Q50lsJo3Az!QZSN2JJ8Yp2$@yTMY&aG)CZ1)KvP; ztZrik(q`oDpQeEHFLxr0B!V+f2bUo4J(9LSE z=JJ3S4JF`cZ;arbnJNEe&!li4KI!mVly{jQDEh9{#g#K#*>5!GbXa+|$7fZQ>O1%e zoqU&!dnxhF4fFZy(fQ!w7p`g^7Bd~8g{*xgA4v?RH{~C;p`<7S=Gl+t<2{Kxp(61F z2H~P0@)0{bIxQ!Ud@upVO6AFYB;xq>w0)UgF;zeG_a6(IyXD{{w-W+2L>wIM`C=8t zkjq$aWxjW)MQ4foo_ZCR=(M3qr-HXRrC&QSE0Y22L_}dP{%L|Mp2s5+QMkhAiQUyf z#vhs2mrdNPPCNkG^MvKI(L3wOLXW4hiQ)9_q2jniL~iZon*7bKOREv#;aGQVY~^l% zNDiC%q++ffM?zR!+y?V|PSD<8(O3s0S9BJ?z8kczcR9A&nPl%+v4Ou6y*q@j5>25J zsqrow1tlBS;|9c}x$%f_a0fawj2XEX*7LFQrx!*k&Xs(mfr}}0u-JiA8FerBngqX! z&%NEK7J<7TGv4P>D@~`!!OV;WH&7fI7Rivw2}{~e$UwrRgT5U(XLz3Y%>`P?-B!yIE$U&S)s)Euak45G~|H`rsj zToJv#JY1|L2+!XM_nXo>4c#cIi;tZc`f(bz|&CgpF%bHncaTc<8 zOct7uFIR1K4sQu|cc6Vx3@Gi7QxlSsf&uGt5r}fZLx8j)ENv7D;8ivQYBUT4@Y>se z#wR!vx%TzNs4-i=G27rl!F%Vqp0YPF%}R~$f)pvQuWvmqw$fc2=LsBK8S#^^C&Nq3 zQw(S8KVG=mxn#6D8$9Wp8Q*>?#s8Ci8w;u5N!O%4fmC?o|D3GxdRMX+tP@5Jispob zg!h0LDA9hON$V>(XMTQb>pkFl*8#0bC!lGCMNAwFx-FyuDu))Or+a+w^JO%PBP~Z6kwzLAMwEs}gu1X(OzqMFLgX);BbyprX11nDo90Q#}YJfPt+CEEbKJ8<#2q8O&ju zQHr}m-=5!XGzNa7)eyD{bB~`5v{jOTDt=XDN+3d(hkvu7zkFs>ze!Sh&Bfr$h2S*pX8lU2Rr~d{;d0rY z&P8in5(9X#O&s$Mq@%FVJ}0uX@TO9S0IB*zH?!@V3JFdqn>Y1pNV3K**Dk5sH^ynD3Af z@$fO}Jvl2I+}2MEd6M z?JHLE@Z_^#3q$z?l8o0OcD5WONS1rsq3is=m{zwVsbs=5OaO`K@!n&)@gils0ZD4s z7QHo@r&|JcTr}^xl3Lx^A;Iuzh?Rq)9jSF#Bk~`UQdH_Ru#qxm#(ijd+!C_9^t?kR zK&h%X(-ah!H(dkL{It!-B%~s`=Tm^F_^-e07+-8`L;j4y`fSmf{=>Z(QeA#$qUh2rNGUR8ezX9yj#`RA zQQ+pZoO$;WXOzym$jAs5R`%>nXru_4*Pjo@;5blTv$F1IHBKC9pO^Jk+v`5MG?QkJ z1;@eS^I_!l#%pi8{Oo&Po_!uPB?ZiJp{Ly+nJwl}Ob6K^EFFCHpO7&8a+QgzFr9Hx zv~TX}RYhIsrG4_aeDmnzTcnfaudlZ@?(o6)83EBCo41$uoCVz1RE55HY7_>P7@AjM zx*^3!n@ife+wk4K^^9M`oVFdnCZl@&snZgPp*cNXYjn78-Hp1|=Fherb)D#6*?5NJHJza?IA)22>m}s(v-^C()VTK8pQX$tZdZFM zjkJvKCr@N&*<`|4`IPQ-ak(td(wsU9rBlx{jOU%2VpcS~B*e(o9%S2Z9v5jfAT9Ma zrq_^s{NVXzOmO3=9m5rRFG%OX`Tlt;j^27yIlpnB+64S^J^E8X-Q6cH=WYp zbG*nUh_rljV*3tROSiJwXi~#CzJlJa*UpLw&Ex9r)X6f@Uq+~e-L+41)^mjkA@gY6 zyo*zpoYu}wWEx-Q%dqj_&_fd$f^|nE=ZpI2+e42F0%rlH0PDWF{iIqX6id<#jowpj za?5Wl_>PyzH)7pn3N$b9;2<4v-k&V`tHzI3^#XMJo-+j&n?H-i*g^Pih+k>x_cmRR zV#?;Tq(-Nv#ENfNOsd!hhr3$%tjPfEk+2L ze;7i=jUUaWD*695Jgfi7_fMG-=aGt9ywX zSOtV9mt%D6t?m)9QVUI0Q`mVM07|9$uT~6w2b@ z=BGEa4_ZPohmv;ywdjrPm^n?k0;dT|2cGB5ovkRzj>ID>vIwD9e0RZeO5M64!}V%5 z2q~r^uneJ7Ts_(qHV%4TG*!x?%Wqw#^UnW*5B@SoP@Cv>WQ=oCl$&$t-g55wrSiZd6 z$e_jLd{MJqFzWta-dB-6PW++yWCoZP8zxJA5BX3lc8iO&VdPn!jdr)6@HP!U)8_@h zcpkUB()ZxN)Y8*#Omlr~A;PN50v;y7&P`9R#DmphZZQ;);|-we+69&blMhChh1{~| zCiLP;1)K@*$BHE^NEI<7S2xJsRn!@;Udg}z;PlS-8zRxwT1%nW4;>fh&$2f;{nfWH zKxJ6zqAL1f_Ljp_6Z!ZzSQw^?luaUy2 zbEYq-KFWITC6Z6-vP*4+kZOUvTgCFDfFqXRJ2mP!BMuju)Q)?;QmMX~&V*H%?i#e+ zR|{LNB#1MAiwYFQkkYU-eQIGK(MLuZHm)!3e&D%*hh%@=62ituJIcZ7xc=d8Tzlfr z!i&O^#FKBm7FN6Hnv;~9xl{u44vq&Fvh3B2bZJNlnU)h6_08*u<$$4}CX9DTS~x!> z41J8dAICySU^^>1+b1BLX&cbq`mk%|^!4Qh=0Uk$ciQHb>-;Pq>4BU&qXP%0L>{Ar0JN{#;=OS0BQe&}HiyJdeV?mb6)-iy#WYv6X z;|`h_^!~9QinMqUhf>}9*(@~~pUAEJV!T3^wj7>rcbDMmbR}w3!bf8N^Ko5>=i1rh z{^NBOS%C#w8;{G1j)rCahJE~Nsf{n{ZExv~fZL6Ou^&?2f9uYzALPB9nQ6e|Bpn-+ z?_3JZ4|7)}Kyqz2l8@-Lu!!<{0M_)m9d3I7~$*o5g=?k_VzjC-N9 
zo(N{W=1q6)OF+T3KArQ-(9vVF_o4EOsD-c<@Q|(L`9UDyiLeZDrYG%T^;u#ucYIb3 z5yppx$UfYGh6lM*NV_7WJ~c0WYD4xcKrG;UiJk{jOT79JQHRSTv;V^z8*>)99~3l- zzCf690qF7~p`wboxz&}n=2%IPmfJ#u0r`H@+9YCFB?|Y(HH$LQn~H@_8l!;Q;-e$k zQhnv8Egt;%Oa{~>R^n;YR_(^ti;))Arq1fWZ3Nh1?-%c)|B2s3;UQ3$DLXuPpM#Li zTyNK1P?6$qkrooa!mPCek{x1|DBP_>hyE7!{-3o`>vwm41+=p6jg9M2bR-E~Mx2WW z90=&yMN?8a|@r6B+Jd|XB;9F*H6-{m!1{v+_6)wA@< z2P7t3+rnh6I_=eVI2|2t4 z-n(-NUqm7{hjBOBo0*3h`c|`~nkZWPZ&$m(s;1cfj)Q1RG8?ac5Is@v9E@sq{l#^tw+9 zoe+r6rW5xg$D5ki_Xf{cuwvfaffz^HNNwUn1PT^OW)N=8Cd~Gi9dIcHYOPrD9)A>F zj@^NH{&1s9Hs3%51xAB?Svs9EwF4^=rkv}P`?d$oA-IsH$)O2V?sRTD6E5Ci6kgde zoH>#PuB}R;Pj@g!kA%%V(CgSxRCiz}s0bO2URiOE_$pDChFW6dxp)6E@D=}GofJ9X zpNT?v#A-weLYtrE2@ZuOu(~oC#fK#tiJ1$aU)pgBq|IW-P}ldePg%2Vtd^je=WeBs zN&C#~zwN^+!*mR2e2E+-e5c?=2pJ}xn%~C0C=ThF$@v85?b}t~Yj{r%CNOJ~Fy*6W z%uzr8G%;ZR1q-xQ95`m%K5F)qIZ20we0CegSi5Um@Qoy3LrJz1<~{K`PCNV4NKPh(rqkT`+%sF;e zAFJCo%eqPCBK`gtX-kO`t)60#4nUqJIM^x|Xi$knetdABwFhIzhcB`! z)Vh>jw9saKuPqnV0p|NuR8S#iW}22KVXkwoY>%Yh$%uWwDQ@7Q+|q_2e{3aPd7Wig zV7A7{4>>(qO&K;68=pdDm;~Yuwn;0F8DHr&8*7?WozhNmA&aw5Djnt*HPPnH>+A=o z6lP%NbIJa!I?GpbjvIF2&kb-XaWmI{-|Jo43D?%t7w(pSd<&YGfO98W)nA!!?Dc^3xo5X zZ(VChBsaonmC969(fPQrpgls`Eq!TR|KZEb*ib!2{Jvb*oKSOGm$*3A9I8v=81-!4 zfF%;JKXmK;dM=ZhI3l|bR?q4^z2hpeXH7(%@`yLbw_#KEWJG3_Nz78ML@X1({WSZv)W2kw_0(eJYpQ`pO-MU=FV2*4Ue_Q`| z4ljv>yZu?wBu}t+1Ai#DYBB@>GqfmL5G}zrl`&e9ieH+nJ#x%gY*K>zDZV8)q=L?w zK|~-<81e|eXwix4%c?5zrX_cb4{s^)F)SO>p=`6{!vJ7^{saCBkHs%tXbGw1rN}69 zKXCijwrXnbqx(hj(p}o4xN(r7k-JbzDSP2O76((}Ho!O`H`d_c}5Llf@f)ZFAJ$U2ana2=C zeB-x3Syr#I0BM?>!5{QWjxwvppc5W)wyJaIEuUsl=I%TFhlY0OcOdJ-Hf050T33&% ztAH2TPhoo4y&fAnPHl?O)45ju z;JDdt7}ZLIT?Q}LIj6s&2E!#7R*v67rJ3L^bz@WS5Yr^)W77WBc~tbgaka+HpYGaukojs{qy5Fz+8)Av(d@aQ?b_y=5a zX2ITtL5)j4*Uv5WzWssol41~cdqi+YDbkw=_H%}zw_{12VOp3uYwvd1d9A=+_*H|B zC75G<1jVj!gM6fu&Ts<}x;iobgq<2qmoquBQxEYMW=%jOf%au>#fqPAE{JO?T=!-S z1>GKQT9&iPI+_UrT!}X6i}nNkc6K-5Fv{v12Gr!t--0e|M^0fdHY@*$4ey8Q7U^F4 zo8oKqp*~sQ_T5wp?e5|Xz=^f2t&qd3b1aJ9!%>8|JtO% z@BgM7{w?^f=7>Vs#pH!mQe>d<7A8OH7s-?t!avlNth+NLfT(k($LC8<3L!hi^u4KL zk{l`5y-;3ut1qHRqpqR*3(5+UjCeCW&u^u=U{g=M>>>lQ)0P4~NB!?^#1u@GAL`#9 zB8O*t|FL}VLX3UU$tc~`Lq!=>BFihny9>zD-43$w@UW0bA@Y8Q4L^`+2`;aatu@Z! zO?;#+xi>xO5E;_*409&p?A`9)(AwoeQ45SgDqe+b-kVeQeeL}MJNi>hnrut9rXpSG zF!wiFDdhDPl+-O{9+j=mN;^OMj|t!nf{iOYArH9GN0P|i5{&rRa&ZZ=K8+X z**r!|-e$~Y2Sw__L1^4u_6$J~AU+17!L_w8pLv@8NyNt}YZ{ zE6_{VYmG+t{I)IoEK^>h@JRUvGqawD=wkoSKdIDlgXGr+dTS87s1;vLJI?nULmw;2 zo*@bkeP#eNR#m=-W}uI*|CSB)q%4wRYSRVXSL#(LEe;jV;f<W*QP>@9ZKP4@6!^}?^@N38@! 
zMh1~bN!WNYyMKZ5fwbNoo!%>#Z#GnwDs{t-%QRg@zKr0N6;J4#U5$O_DVqvATA_YU zEPxV+IxDt&6Wvm@gE?ME?GrWfaQ=EfV#O6ll=8N50(c6jvv`wRgRWa|htXneM-$_` z4$jiJF!aLmBczM$KY2h#9FMW<#lThEu|?x8qAMxm*U{;Jz7ODSfE^UJ3EiBnd#h5I z%+B;+MPdI1Wi1cd)!z}GDMJ2U{7kpr2DwGwf4cpCeDuzz{gbfGxN9!i>;m;#0Ggjk zw4ZOO;CUp?`pl1}qC&r2Qo@^$4%G$|v&w#*Vx)L&Evio%I|^XLVC~#q%ZK_8IE~}W z{WD)}QS_-VGLoHU?V&_%{p2UB=Sbnbv-QpP|LN__!>QihHvZKhLzyyX9#T7H2+7Pw zkt4K8W!OrQq)3L4AwmPC6oVA%fqdgLx%sNAhTyiLsJ)wLxtr7G?t zQmA%@I0#=GzsS_Nvk0Y8D(!jJr7~ac6$NIU!ydCk9WM1_-=vHB`;F}jcm&yu&wS8l zOO^OKY~|RH5$X2wKvBB>HvZC$4CTLrE`m<>HtU)BPvgU%bT))e$RuTmI}Lq*b+X?w zy=Rku;p0n^)K9JR^Glc5zn{bL(*Ky>2o?VXUGk>>?*)1O6U88r)!U?FlEn*Y18IXqB#QtHZ;?bNsP;6u!@7 zGGppC`LB{)fR=>g03tqeSNDjen=%FurYp$N#Of{OSRH-Z77Y$g2{#qgWusU0JJPOe z?f)YaPCk=B8?y;Mt69R!TMtJ!wct1lm z8S81iZ<3RJaw;f_`^*`8$SZ#&pD3fKxbQ&b ztQPvEnt%`Wh7WyX-M+tPrK#zSOiRTeHs)}9v8ZmqwOiFPw56xbj{yTfztW_wD+teo z_&x=G+sE1t0{mT4^%j2i_Fg~jH~tz1tm*j9*KB|9NE5e+zq2|LyZ`q(p3$YKRlfK`MAC-4?Ec%p1a!b(XL4#P3vOd6u!EI!_5gsJ zgOfATX-z#r;_jRUuC{>DHw^OQ$Onh25&>`5T_AF&XzoLQ zkoM6TZP*+ppeI6BRkf%k49;1-u*a+0m8gFl*rNw8U*2MT3>ba$@n9#~IPSrHE@)=F zKKmxHuNQQ90m^SV zK6D&DaKmpar3;-Gk5M zfw$IQ!;3|W+@)A=nST!%p1lQNS+z$W27EB8^nR@l_uB{PkTEbY7--Js2CG-;Qij?t zc33Sgpa$Ml=(?+m0fEFusis;5eSS`~7aImH8BQ=gQ{IvefVVNc5PROgKaP_xR+n^y zw9=mU+(VZLEc2RRzILa)TwX^<9K7R010FD08)(T}ib0v#_5r{!d1dFamaGO5*U(4| zBBLu!GV1CAqxU{1&;|PIZsTpAhN0)ft}aP<^660Bpo^HnZ8WphtEay|HYG(AFR;?; zo26+ocfCczIa7OQw9mjA^CbCYIWJ}L%T(@-%>!9VVrUlFG|$&J74`J=x<7tAjfZ6E zx;Ej|DN`pW3E|b--xd9CWp2(M!SV>5)g4qtxB!ZZLrO{tXA;2Hwbg zN|0+Io(zD@DwI)Zs2;H%oSdGf7qqhANvI7^ue|U@*#Z>;$h zs$54J2YF zESpu+o=;*bH3CQ>p?^dW6q~xWFZ7OK66~yr<45-nKb*1?upPigNgbVZLy(&PGH3G! zG|CmhqgrpgX6e}YxH0_yHo<#wW-3KvufTGvln6Mp^#G}8*SmA1^DfU}7{Mi=DM^?_ z&aJLtG3e7GUWB<@3#D$}y43{uEyh|m_#jcZ6K`*2ApEkwW*qAY_TV8@8z(jOqw ztAa*`_NQJn{QBK_1++&3_)a`z*81y6{`fI{0RF1tg%w}LF{@)|WW0(ZsP%{5Gl4vwgkLWk)&C-+zR0b5tbJEv z5AfK>x_s&l=Vs&;6@fa5f$OC#TCWQ4f2T!6W$)GyUxFbs29kI$AmnBk0o^@4w(d^w zKK(f%#KljXKQH(!Z5=OM9L;fG=PeZtria&t!c7pXM&yKMFD?`a#rd#I9vd5bfG5C( zzUI*HgE<4Qt}ko2tiK~aJHS%cT50+6ot<}lQ}lw>Nz*+R#KmIj3vjKmmf5scZSBy> zgIHJi$xWd*zZjF3w1biOm1%tJ>Jd2NR)d{523J~HJw1t@o}M7A%|)PT-h;WKXJaNC zOfif1zC;i2Z+0^oO01jRj@v{L6$BU93K4jzEo`CLj3_=^TU&A+y+}uDONw86qvbjd z6DkfJlpFuVTNb8j06|)r4D_o##aB7^qns|CsP`$(6M4ni+4+2kp;>$;aad__4Lt`X zWuqtICL7~WAOt^E6Asz?FdAetQie5W{<*ZYRsK4cQh*)DCuXO=aZ|kjZkxHZdEMp; z4-X$7xRR)Iesik2S#Il)N!zcwfj8(CgpxM-{kt%#;&<01oLlFcu25DfL zt|>XROYPNm*+h+sRPrKrU`nfq2b$64W`LUF{H$YKJl zc@x|(c{VL=hqtRkfj!RfiHIALw!87s(f};&B|t+8fUshh+T6LH2@H+U&&e>!o;Y0h8Yk+QQ8> z2Hxa)6ODA9k0BESY{#l1aIv~AqhMrB{DDY|=M$HhxX5PgaZXN-l1u2g*)_-Fc`y#< z*}wUcP7GjHKR^5@-Z;mzJ-4d2UT4b$J&30sfVvGwj_8;pp(MmSHFjyWo2KjwX;S_qu)Qz53g4a#*No$xnLvk&8vPdL4G; z&b{;1sEP{RHw|_!^#JTSiJ_2?5RtOdWoq9iCz&wRZv5~i2*@XX35ipP>D@?XDVea< z%U7&;l$E%wesFNm?84hdu+Bo~X1{6s_AWT`ZDa|i&M8qfmW}Q|VNuBMt^_RH{U=|S z>|bVnN;DGd(5~7OLhZLa5`S;#IX!*_Pi_*@<4kgLj4b`QjEoG0rS>5@f;Sy@mX?;* zg9H8~yheQon-xi?ZI1P&hakAkr`jvS4cV87M^ z;*9eH-=sbTTl<@EaV0A{p|>-Dt}HS60?^Mlc5Zw)>~w1oHTo7q-v=N`KU z!3|ms;N-pO&bPgU5dMpH)^hEo6Qro!mwvQ6yy82VQCpRikXX_4jNmofnr5HCpI=zmVdoqo zdku_Zn{qZwTm7oR3E-GH5>xAR?MQU7_rUV~{{9dE-=6)d$xV8`kwAhcH!sE{5_DQ7 zh{}@~gs22q9xlYdti~)mMrI@yb)XZ7u!WoMA`~ImC~|HOZv%>nk34!L%VSvo`jWT0 zL}p~X-9MdS5T?`I+}sEV?E-f8Uc?R(u9jP;JLXTu<@)t%KlV+^&HwQFmJ&wCF<=I- z;H^4B-DRcj!Qfp;GH^0#6%-bb)_bhH-9;mTBr!bv!NL2@Ju&EpxDzKHBKagID^E$R zxBH_)AEyX$pD`CNieNEVSz83eGSO?I>h2um7sAQ-K4W}yx;FpQiz*u+3CM7Xj*UhB zwGh++Gf&SINH1-AXWu^84l78it3ra6ni@L-^8WwLZ>=wbB2K&7{j@(UP!!Yg#KCL z(=}vs08kSa9HbvUfBuUG0JvBIT>Jq+m;g#Ie@n~Am8rjz;og6kE0fHAdiyA2itn>-=~l-{rp3D3^_eLr)NkJ+r700Lw(x_ 
zYXGvWoP&ddPaHE0_iu&F=fv4Kr=@>MATkPL%F9Et{IK>DasodepUlLO3Q^c`lVDHD zINWer8O^s7`63Gox1554DR~@HQfn}-M~k-10EuY^=uEbAcO^14JWp8=2G-!wD$UH! z#+YB>*Ys*3LRS!G(1+vtfR7PD=C@Smk~K1oEzr`xH3m7hG~k(?J#$6|$1qmcZoR%; zQw{pN7~{g^@La{(dwki;atP(7Dbsj&hNv~O~onXiA@DtRgkfoTz4Q6?SwsaE|=gxg&?iq;D^bDXm65b!L+~5ttHo%K;eQ0Cg)3WY&-^Az2?(aOwup`FL8|GH|d}@siuUOFG^x+lVkDXnh3V}CuV-_f*(D3wLwRYm=v~MAtm8^!MEs=SDNCWJ|5QB zFG97IBooZr+a-t6^@0U>^~NGJ_JA`Z4OthMdk*KZpwW#A+vJgMVJV=s@bcU49ZyYq zao*HFaMH<(4$kJynTsV%$-2<6ZThehq zOgEZu017_d7bzz>|AZ$}k07cBq6P{sf~bi^(JP4L#-DtMdm)tu=rN8X6;hyc*h!wO zjl#It_3qJGM`R;lo2a4kbQNsg!{m^%$K_ylasmkv0sO23OsEo+0KMXi1^C$_TD@vf zwrZ*f3Cv~Wcf2}{^Z=_)@t)`6p-6FxIz9rPpx^xRWwwrP;D{;IG*dlw3{#{Jv%HR+ zjmDawJE4g;f#Xg@d5{7Qc^8DrpcCHnaADpk%7NXeKABota+L*+j-2TZf|f4!YNb89 zq$@&Bv_pjpD?8d4R7%L@`%PLs#=t8(6naB}7AeD$BT5lPDQ?J8EVB!#V%W&bM)MKL z2JK_l1!|HhD$V@MmaR$#kC+n^LCv?fW@n*V;D{3xrOx5}XX8X*g6)#UpqaV2T!wbV z53Bc91AE6JiMIC&)^Ur znT!zE-v^PWEoPq&QkKh3>|L!pzvooPEe~EW#W-QQup-$Kv-I8j_m-|XPf>9uX$=-l z<1Cxbl0uh?BkLuA#&s2cOED2_L^VA5&Rb?{+y|H=6QnaDM<^!HP%!Alo!RLktpXn8 z;@6V+I4%U$jFs^NBV%`yay=3HlaVl2BTXf*O9G2=;}ojGIQ=X{PdDS?6twc}_PV`& zNC_H&YJ{YOJ|9#<8I3;v-p;t6;>eKFtp;m5Gt9~Y2Bc1UmgUACI zA$}37BD1suiOTlg!xa@3k_iVS-$q2K`QS=;`qC`3AEI2FJ-!+{IylFPOpGT?Nb}WF z{$$~dl~Yz0rh&&_B%7Az_+$CI(Tga76mP96GzJz!?ex!IzSLs-f%~UwC@efs92PLt z!ij^aq@Ghf9Lu`qbXR}~KoFsnl56YgbXvwge?HdgWri(;c;0uVhveV89-UeU7Ke(z z0gX14Fuk0WPtRkp=&?NQH+OSmWSoD(lGfGo>5N0g0r{UwGyQjH-i>>LLPF?kF7_dQ z1WI0nh5?i#5erOS4dm4!w4kcl(&J=hwHPt}{g}~Zq=2NDkAhq6S1~E61h?wrJp|M>!CXQC?m;9f z^?<1=_^T|L#Ib$I7mb&n>j6@3)#ur+{C||q22`!NXR*!EWj|-iIE?)%eq`V&Ydx&b z_G1Y09;>2Kt=<>8)d4gj5g;587`Oq%>msPS@;AX1SR%=;2Fk1so}mR>a(Jjrq=!@l zzF2(p)>`IJ=n}TIZMj_UUxTuN49Xy!`(v;t8vf8G=>>|CFWu^DA=}1~IMT3%O$Ek!%3BHiqX)&v}{r@!|$kd%Mb`v#MBRi1Y+zC}^T-L(k}FA}U|Kq;&7# zAdJ!tdnQvk?8j6;Vk#%friG1Ldx0i8NvtpM#Dahnf|@;sQB?Kztu!1<{PTAGy8h7e z?YF&RkbU&s?Z1r8O+IY274PrRLfw)dJS@?nw!%bcq;8^onmkS2-4#d;Hs$&IPcvWm zY=vq)EDg2@*uEaWn>3)6ez$s=?e2gN3H7Dlu_>^Sij_=^;p>Ia?S;w^JW}C;=+kt| zW3%tXK$D&GDqYjG6yPYWNlQ;Ft7*^nRFu4wG@ z=cP~;rsn1+ke0+@N!)Z8L8u00E=Y=U@@-W21<58^pzd;(`d{HRHx!RGS2YzC9F+>I ze^c$i6Z`%-p!Hvq>wkXq|9db0|DbgscW%+gYTENnt(S4~n4&DqtW9s2Fr)qlddjJd literal 0 HcmV?d00001 From 663e8b6c35e08136451f5de9f2c582ef92ccafc9 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Sun, 19 Oct 2025 06:04:14 +0000 Subject: [PATCH 03/48] add amd perf benchmark data Signed-off-by: tjtanaa --- docs/amd-perf.md | 47 ++++++++++++++++++++++++++++++++++++++++++++++- 1 file changed, 46 insertions(+), 1 deletion(-) diff --git a/docs/amd-perf.md b/docs/amd-perf.md index 433ff59..ea60664 100644 --- a/docs/amd-perf.md +++ b/docs/amd-perf.md @@ -1,4 +1,4 @@ -# Performance of safetensors on AMD GPUs +# Performance of FastSafeTensors on AMD GPUs ## DeepSeek-R1 vLLM Model Weight Loading Speed @@ -8,6 +8,10 @@ NOTES: `fastsafetensors` does not support GDS feature on ROCm as there are no GD ### Benchmark Methodology +**Platform:** AMD ROCm 7.0.1 +**GPUs:** 8x AMD Instinct MI300X +**Library:** fastsafetensors 0.1.15 + 1. **Clear system cache** to ensure consistent starting conditions: ```bash sudo sh -c 'sync && echo 3 > /proc/sys/vm/drop_caches' @@ -41,3 +45,44 @@ The experiments are carried on MI300X. 
+ +## GPT-2 perf tests based on the script [perf/fastsafetensors_perf/perf.py](../perf/fastsafetensors_perf/perf.py) + +### Test Configuration + +All tests were performed on single-GPU loading scenarios with two different model sizes: +- **GPT-2 (small):** 523MB safetensors file +- **GPT-2 Medium:** ~1.4GB safetensors file + +#### Key Parameters Tested: +- **nogds mode:** ROCm fallback (GDS not available on AMD GPUs) +- **Thread counts:** 8, 16, 32 +- **Buffer sizes:** 8MB, 16MB, 32MB +- **Loading methods:** nogds (async I/O), mmap (memory-mapped) +- **Data types:** AUTO (no conversion), F16 (half precision conversion) + +--- + +#### Performance Results + +##### GPT-2 (523MB) - Single GPU Tests + +| Test # | Method | Threads | Buffer | Config | Bandwidth | Elapsed Time | Notes | +|--------|--------|---------|--------|--------|-----------|--------------|-------| +| 1 | nogds | 16 | 16MB | default | **1.91 GB/s** | 0.268s | Baseline test | +| 2 | nogds | 32 | 32MB | default | **2.07 GB/s** | 0.246s | Higher threads/buffer | +| 3 | nogds | 8 | 8MB | default | **2.10 GB/s** | 0.243s | Lower threads/buffer | +| 4 | mmap | N/A | N/A | default | **1.01 GB/s** | 0.505s | Memory-mapped | +| 5 | nogds | 32 | 32MB | cache-drop | **1.24 GB/s** | 0.410s | Cold cache test | +| 6 | nogds | 32 | 32MB | F16 dtype | **0.77 GB/s** | 0.332s | With type conversion | +| 8 | nogds | 16 | 16MB | **optimal** | **2.62 GB/s** | 0.195s | Best config | + +##### GPT-2 Medium (1.4GB) - Single GPU Tests + +| Test # | Method | Threads | Buffer | Block Size | Bandwidth | Elapsed Time | Notes | +|--------|--------|---------|--------|------------|-----------|--------------|-------| +| 9 | nogds | 16 | 16MB | 160MB | **6.02 GB/s** | 0.235s | Optimal config | +| 10 | mmap | N/A | N/A | N/A | **1.28 GB/s** | 1.104s | Memory-mapped | +| 11 | nogds | 32 | 32MB | 160MB | **5.34 GB/s** | 0.265s | Higher threads | + +--- \ No newline at end of file From 93e247ead66d53bcf01ed337c758afe0df0dab87 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Mon, 20 Oct 2025 06:08:42 +0000 Subject: [PATCH 04/48] fix image Signed-off-by: tjtanaa --- docs/images/fastsafetensors-rocm.png | Bin 54504 -> 50678 bytes 1 file changed, 0 insertions(+), 0 deletions(-) diff --git a/docs/images/fastsafetensors-rocm.png b/docs/images/fastsafetensors-rocm.png index 526b695e16aa4716a590668d9f9b08e34d1c43c8..7bc23242b2ce37a90dc223eed03e4269dc087a22 100644 GIT binary patch delta 21353 zcmcG$2UHYW8!g!8fPjIZC~%b|AfPBYsfgGjIcJe1P0r8=g$b@8piPpTV?!eux(Nyj z0s<16+yu!DGzc^~%qhM1|7T{sH}mGLHML|d!0M_x=X~G(_TJ|!W^xX#1s{6nd+@7y zA@s!s%H0VYPl{SULkZsFMrb`AnM`|6KMj^*CaxA{u-ME>Hf|oi;Pac1%q$PG$ zN33TKTR>lsU(_z85%?5BW+o0v8)71!1b3wgICKV7k+vkqc|sh~`FD3-aIzXN*owFY z9|kx3B(_93f90Lg*4qydZg!Dr<~O2S5PYcX;GOd1V4dapfW#3|MV0ytXJy4^ zXv9v&EGb1NF0*vI_$1#$3(qKi(d%~u%w|GGgtFBiU<8#YnL?eqwo|wx%|+8#6}7wu z5!RI8RKxC7rvu=Iqi^4hf*YE=H$mUyh?1L9_wXSFzf(?Ykftj_J!+i7-<6nUtPt3JowLc9 z$*L6DlQt;#EU`wzkY;@@a?QM?eB)!{!18l)|4-`e@b|H0_Bb}uQrVQ-J|T5SzWuY~ zA$ZF7&ac4_RoYzh^VIrWOE{kQ$IpVYGql9NIMp#Ff}UAM0ZLpd1Wp@G=(9bL)iSnn?j|+VJ}p#TxkS`6Fg`#jn#)}?siKU0al`~% zKy-RBzw-G(c;59toiqWn!T9D*hr#gTS)_l^ zLNuY@x_fbcQ$rzC0}8QumciL{Eu6DyvDa_+QB>NbwHGTqhHM*7uLFqN`NFAfU*W}$ zBwRwfPiMhjk!?yEi+!SzXTKz|8)W1dhI0SSjzWh7^v>$%?3ZA!wMs0##3@(aYr1m- zlP=iNI$>QjGxxR>byi0=xVVS^dwZtNSdPf`yWlPmLfl6$3XA|1X=TQXF0I!yzSL## zzDG^}kyZb-1E@1Ps`Mh&_dP|=qwnw5R+%T>%@-vZK*@wWoPdgINsaRB(6b@NQt~N& zchF@E#)|9nVBQh_25%XwK;-w>oH0>tFRPv_8KhMr=b9mnRSl*q%RF`Uho#Cw(2Zph z(1Pv3PyLV22k2Nkc6rXumE3R)dw9viF;L6ik30D1iz{x<&unQQk+ZY?uR8`FMtnN* 
[binary patch delta data omitted]

From 962010c670220c8a6f33b763a47e3f1d1bb79ced Mon Sep 17 00:00:00 2001
From: tjtanaa
Date: Fri, 24 Oct 2025 06:17:12 +0000
Subject: [PATCH 05/48] address reviewer feedback

Signed-off-by: tjtanaa
---
 fastsafetensors/common.py            | 12 ++--
 fastsafetensors/cpp/cuda_compat.h    | 14 ++--
 fastsafetensors/cpp/ext.cpp          | 40 +++++++++++-
 fastsafetensors/cpp/ext.hpp          |  5 +-
 fastsafetensors/dlpack.py            | 47 ++++++++------
 fastsafetensors/frameworks/_torch.py | 13 +++-
 fastsafetensors/loader.py            |  8 ++-
 setup.py                             | 31 +++++----
 tests/conftest.py                    |  4 +-
 tests/platform_utils.py              | 95 ++++++++++++++++++----------
 tests/test_fastsafetensors.py        | 35 ++++++----
 tests/test_multi.py                  |  5 +-
 12 files changed, 214 insertions(+), 95 deletions(-)

diff --git a/fastsafetensors/common.py b/fastsafetensors/common.py
index 7dcd581..33446a0 100644
--- a/fastsafetensors/common.py
+++ b/fastsafetensors/common.py
@@ -13,10 +13,14 @@ from .frameworks import FrameworkOpBase, TensorBase
 from .st_types import Device, DType
 
-# Add compatibility alias for is_cuda_found -> is_hip_found
-# This allows code written for CUDA to work transparently on both CUDA and ROCm
-if not hasattr(fstcpp, 'is_cuda_found'):
-    fstcpp.is_cuda_found = fstcpp.is_hip_found
+
+def is_gpu_found():
+    """Check if any GPU (CUDA or HIP) is available.
+ + Returns True if either CUDA or ROCm/HIP GPUs are detected. + This allows code to work transparently across both platforms. + """ + return fstcpp.is_cuda_found() or fstcpp.is_hip_found() def get_device_numa_node(device: Optional[int]) -> Optional[int]: diff --git a/fastsafetensors/cpp/cuda_compat.h b/fastsafetensors/cpp/cuda_compat.h index 0c3cc69..f430ec3 100644 --- a/fastsafetensors/cpp/cuda_compat.h +++ b/fastsafetensors/cpp/cuda_compat.h @@ -1,21 +1,25 @@ +// SPDX-License-Identifier: Apache-2.0 /* * Copyright 2024 IBM Inc. All rights reserved - * SPDX-License-Identifier: Apache-2.0 * * CUDA/HIP compatibility layer for fastsafetensors * Minimal compatibility header - only defines what hipify-perl doesn't handle */ -#pragma once +#ifndef __CUDA_COMPAT_H__ +#define __CUDA_COMPAT_H__ // Platform detection - this gets hipified to check __HIP_PLATFORM_AMD__ #ifdef __HIP_PLATFORM_AMD__ #ifndef USE_ROCM #define USE_ROCM #endif - #include + // Note: We do NOT include here to avoid compile-time dependencies. + // Instead, we dynamically load the ROCm runtime library (libamdhip64.so) at runtime + // using dlopen(), just like we do for CUDA (libcudart.so). + // Minimal types are defined in ext.hpp. #else - // For CUDA platform, or when CUDA headers aren't available, we define minimal types in ext.hpp + // For CUDA platform, we also avoid including headers and define minimal types in ext.hpp #endif // Runtime library name - hipify-perl doesn't change string literals @@ -31,3 +35,5 @@ #define cudaDeviceMalloc hipDeviceMalloc #define cudaDeviceFree hipDeviceFree #endif + +#endif // __CUDA_COMPAT_H__ diff --git a/fastsafetensors/cpp/ext.cpp b/fastsafetensors/cpp/ext.cpp index f48d937..bd15650 100644 --- a/fastsafetensors/cpp/ext.cpp +++ b/fastsafetensors/cpp/ext.cpp @@ -79,6 +79,7 @@ ext_funcs_t cpu_fns = ext_funcs_t { ext_funcs_t cuda_fns; static bool cuda_found = false; +static bool is_hip_runtime = false; // Track if we loaded HIP (not auto-hipified) static bool cufile_found = false; static int cufile_ver = 0; @@ -123,8 +124,12 @@ static void load_nvidia_functions() { count = 0; // why cudaGetDeviceCount returns non-zero for errors? 
} cuda_found = count > 0; + // Detect if we loaded HIP runtime (ROCm) vs CUDA runtime + if (cuda_found && std::string(cudartLib).find("hip") != std::string::npos) { + is_hip_runtime = true; + } if (init_log) { - fprintf(stderr, "[DEBUG] device count=%d, cuda_found=%d\n", count, cuda_found); + fprintf(stderr, "[DEBUG] device count=%d, cuda_found=%d, is_hip_runtime=%d\n", count, cuda_found, is_hip_runtime); } } else { cuda_found = false; @@ -218,11 +223,28 @@ static void load_nvidia_functions() { } } +// Note: is_cuda_found gets auto-hipified to is_hip_found on ROCm builds +// So this function will be is_hip_found() after hipification on ROCm bool is_cuda_found() { return cuda_found; } +// Separate function that always returns false on ROCm (CUDA not available on ROCm) +// This will be used for the "is_cuda_found" Python export on ROCm builds +bool cuda_not_available() +{ + return false; // On ROCm, CUDA is never available +} + +// Separate function for checking HIP runtime detection (not hipified) +// On CUDA: checks if HIP runtime was detected +// On ROCm: not used (is_cuda_found gets hipified to is_hip_found) +bool check_hip_runtime() +{ + return is_hip_runtime; +} + bool is_cufile_found() { return cufile_found; @@ -719,7 +741,21 @@ cpp_metrics_t get_cpp_metrics() { PYBIND11_MODULE(__MOD_NAME__, m) { - m.def("is_cuda_found", &is_cuda_found); + // Export both is_cuda_found and is_hip_found on all platforms + // Use string concatenation to prevent hipify from converting the export names +#ifdef USE_ROCM + // On ROCm after hipify: + // - is_cuda_found() becomes is_hip_found(), so export it as "is_hip_found" + // - Export cuda_not_available() as "is_cuda_found" (CUDA not available on ROCm) + m.def(("is_" "cuda" "_found"), &cuda_not_available); // Returns false on ROCm + m.def(("is_" "hip" "_found"), &is_cuda_found); // hipified to is_hip_found, returns hip status +#else + // On CUDA: + // - is_cuda_found() checks for CUDA + // - check_hip_runtime() checks if HIP runtime was loaded + m.def(("is_" "cuda" "_found"), &is_cuda_found); + m.def(("is_" "hip" "_found"), &check_hip_runtime); +#endif m.def("is_cufile_found", &is_cufile_found); m.def("cufile_version", &cufile_version); m.def("set_debug_log", &set_debug_log); diff --git a/fastsafetensors/cpp/ext.hpp b/fastsafetensors/cpp/ext.hpp index 2f7c5d9..961011f 100644 --- a/fastsafetensors/cpp/ext.hpp +++ b/fastsafetensors/cpp/ext.hpp @@ -36,11 +36,10 @@ typedef struct CUfileDescr_t { } CUfileDescr_t; typedef struct CUfileError { CUfileOpError err; } CUfileError_t; -// Only define minimal CUDA types if not using ROCm (where real headers are included) -#ifndef USE_ROCM +// Define minimal CUDA/HIP types for both platforms to avoid compile-time dependencies +// We load all GPU functions dynamically at runtime via dlopen() typedef enum cudaError { cudaSuccess = 0, cudaErrorMemoryAllocation = 2 } cudaError_t; enum cudaMemcpyKind { cudaMemcpyHostToDevice=2, cudaMemcpyDefault = 4 }; -#endif typedef enum CUfileFeatureFlags { diff --git a/fastsafetensors/dlpack.py b/fastsafetensors/dlpack.py index 1d4338e..e8883ed 100644 --- a/fastsafetensors/dlpack.py +++ b/fastsafetensors/dlpack.py @@ -12,26 +12,43 @@ _c_str_dltensor = b"dltensor" -# Detect GPU type at module load time +# Lazy GPU type detection - avoid calling framework-specific code at module load time +_GPU_DEVICE_TYPE = None # Will be detected lazily + + def _detect_gpu_type(): - """Detect if we're running on ROCm or CUDA""" - try: - import torch - if torch.cuda.is_available(): - # Check if this is 
ROCm build - if hasattr(torch.version, 'hip') and torch.version.hip is not None: - return 10 # kDLROCM - except: - pass + """Detect if we're running on ROCm or CUDA. + + This detection is now done lazily to avoid framework-specific calls at module load time. + Uses the C++ extension's is_hip_found() to determine the platform. + """ + # Import here to avoid circular dependency + from . import cpp as fstcpp + + # Check if we loaded HIP runtime (ROCm) + if fstcpp.is_hip_found(): + return 10 # kDLROCM return 2 # kDLCUDA -_GPU_DEVICE_TYPE = _detect_gpu_type() +def _get_gpu_device_type(): + """Get the GPU device type, detecting it lazily if needed.""" + global _GPU_DEVICE_TYPE + if _GPU_DEVICE_TYPE is None: + _GPU_DEVICE_TYPE = _detect_gpu_type() + return _GPU_DEVICE_TYPE class DLDevice(ctypes.Structure): def __init__(self, dev: Device): - self.device_type = self.DeviceToDL[dev.type] + # Use lazy detection to get the GPU device type + gpu_type = _get_gpu_device_type() + device_to_dl = { + DeviceType.CPU: self.kDLCPU, + DeviceType.CUDA: gpu_type, + DeviceType.GPU: gpu_type, + } + self.device_type = device_to_dl[dev.type] self.device_id = dev.index if dev.index is not None else 0 kDLCPU = 1 @@ -42,12 +59,6 @@ def __init__(self, dev: Device): ("device_id", ctypes.c_int), ] - DeviceToDL = { - DeviceType.CPU: kDLCPU, - DeviceType.CUDA: _GPU_DEVICE_TYPE, - DeviceType.GPU: _GPU_DEVICE_TYPE, - } - class c_DLDataType(ctypes.Structure): def __init__(self, dtype: DType): diff --git a/fastsafetensors/frameworks/_torch.py b/fastsafetensors/frameworks/_torch.py index 1487153..affa214 100644 --- a/fastsafetensors/frameworks/_torch.py +++ b/fastsafetensors/frameworks/_torch.py @@ -186,9 +186,18 @@ def copy_tensor(self, dst: TorchTensor, src: TorchTensor): dst.real_tensor.copy_(src.real_tensor) def get_cuda_ver(self) -> str: + """Get GPU runtime version with platform indicator. + + Returns a string like 'hip-5.7.0' for ROCm or 'cuda-12.1' for CUDA, + or 'none' if no GPU is available. This allows code to distinguish + between different GPU platforms without using torch directly. + """ if torch.cuda.is_available(): - return str(torch.version.cuda) - return "0.0" + # Check if this is ROCm/HIP build + if hasattr(torch.version, "hip") and torch.version.hip is not None: + return f"hip-{torch.version.hip}" + return f"cuda-{torch.version.cuda}" + return "none" def get_device_ptr_align(self) -> int: CUDA_PTR_ALIGN: int = 16 diff --git a/fastsafetensors/loader.py b/fastsafetensors/loader.py index 60959fa..9e7e526 100644 --- a/fastsafetensors/loader.py +++ b/fastsafetensors/loader.py @@ -6,7 +6,7 @@ from typing import Any, Dict, List, Optional, OrderedDict, Tuple, Union from . import cpp as fstcpp -from .common import SafeTensorsMetadata, TensorFrame, get_device_numa_node +from .common import SafeTensorsMetadata, TensorFrame, get_device_numa_node, is_gpu_found from .file_buffer import FilesBufferOnDevice from .frameworks import TensorBase, get_framework_op from .st_types import DeviceType, DType @@ -69,8 +69,10 @@ def __init__( gl_set_numa = True fstcpp.set_debug_log(debug_log) device_is_not_cpu = self.device.type != DeviceType.CPU - if device_is_not_cpu and not fstcpp.is_cuda_found(): - raise Exception("[FAIL] libcudart.so does not exist") + if device_is_not_cpu and not is_gpu_found(): + raise Exception( + "[FAIL] GPU runtime library (libcudart.so or libamdhip64.so) does not exist" + ) if not fstcpp.is_cufile_found() and not nogds: warnings.warn( "libcufile.so does not exist but nogds is False. 
use nogds=True", diff --git a/setup.py b/setup.py index adecf4e..dbc7e6e 100644 --- a/setup.py +++ b/setup.py @@ -27,6 +27,7 @@ def detect_platform(): for path in ["/opt/rocm", "/opt/rocm-*"]: if "*" in path: import glob + matches = sorted(glob.glob(path), reverse=True) if matches: rocm_path = matches[0] @@ -45,14 +46,14 @@ def detect_platform(): rocm_version = f.read().strip() else: # Try to extract version from path - match = re.search(r'rocm[-/](\d+\.\d+(?:\.\d+)?)', rocm_path) + match = re.search(r"rocm[-/](\d+\.\d+(?:\.\d+)?)", rocm_path) if match: rocm_version = match.group(1) print(f"Detected ROCm platform at {rocm_path}") if rocm_version: print(f"ROCm version: {rocm_version}") - return ('rocm', rocm_version, rocm_path) + return ("rocm", rocm_version, rocm_path) # Check for CUDA cuda_home = os.environ.get("CUDA_HOME") or os.environ.get("CUDA_PATH") @@ -64,11 +65,11 @@ def detect_platform(): if cuda_home and os.path.exists(cuda_home): print(f"Detected CUDA platform at {cuda_home}") - return ('cuda', None, None) + return ("cuda", None, None) # Default to CUDA if nothing detected print("No GPU platform detected, defaulting to CUDA") - return ('cuda', None, None) + return ("cuda", None, None) def hipify_source_files(rocm_path): @@ -110,7 +111,7 @@ def hipify_source_files(rocm_path): hipified_files = [] for source_path, result in hipify_result.items(): - if hasattr(result, 'hipified_path') and result.hipified_path: + if hasattr(result, "hipified_path") and result.hipified_path: print(f"Successfully hipified: {source_path} -> {result.hipified_path}") hipified_files.append(result.hipified_path) @@ -126,8 +127,9 @@ def hipify_source_files(rocm_path): return hipified_files - -def MyExtension(name, sources, mod_name, platform_type, rocm_path=None, *args, **kwargs): +def MyExtension( + name, sources, mod_name, platform_type, rocm_path=None, *args, **kwargs +): import pybind11 pybind11_path = os.path.dirname(pybind11.__file__) @@ -143,7 +145,7 @@ def MyExtension(name, sources, mod_name, platform_type, rocm_path=None, *args, * kwargs["extra_compile_args"] = ["-fvisibility=hidden", "-std=c++17"] # Platform-specific configuration - if platform_type == 'rocm' and rocm_path: + if platform_type == "rocm" and rocm_path: # ROCm/HIP configuration kwargs["define_macros"].append(("__HIP_PLATFORM_AMD__", "1")) kwargs["libraries"].append("amdhip64") @@ -168,7 +170,7 @@ def run(self): self.rocm_path = rocm_path # Configure build based on platform - if platform_type == 'rocm' and rocm_path: + if platform_type == "rocm" and rocm_path: print("=" * 60) print("Building for AMD ROCm platform") if rocm_version: @@ -182,9 +184,14 @@ def run(self): for ext in self.extensions: new_sources = [] for src in ext.sources: - if 'fastsafetensors/cpp/ext.cpp' in src: + if "fastsafetensors/cpp/ext.cpp" in src: # torch.utils.hipify creates files in hip/ subdirectory - new_sources.append(src.replace('fastsafetensors/cpp/ext.cpp', 'fastsafetensors/cpp/hip/ext.cpp')) + new_sources.append( + src.replace( + "fastsafetensors/cpp/ext.cpp", + "fastsafetensors/cpp/hip/ext.cpp", + ) + ) else: new_sources.append(src) ext.sources = new_sources @@ -234,6 +241,6 @@ def run(self): ) ], cmdclass={ - 'build_ext': CustomBuildExt, + "build_ext": CustomBuildExt, }, ) diff --git a/tests/conftest.py b/tests/conftest.py index 5960d3c..ba054d0 100644 --- a/tests/conftest.py +++ b/tests/conftest.py @@ -6,6 +6,7 @@ from fastsafetensors import SingleGroup from fastsafetensors import cpp as fstcpp +from fastsafetensors.common import is_gpu_found from 
fastsafetensors.cpp import load_nvidia_functions from fastsafetensors.frameworks import FrameworkOpBase, get_framework_op from fastsafetensors.st_types import Device @@ -14,6 +15,7 @@ TESTS_DIR = os.path.dirname(__file__) sys.path.insert(0, TESTS_DIR) from platform_utils import get_platform_info, is_rocm_platform + REPO_ROOT = os.path.dirname(os.path.dirname(TESTS_DIR)) DATA_DIR = os.path.join(REPO_ROOT, ".testdata") TF_DIR = os.path.join(DATA_DIR, "transformers_cache") @@ -81,7 +83,7 @@ def pg(): @pytest.fixture(scope="session", autouse=True) def dev_init() -> None: - if fstcpp.is_cuda_found(): + if is_gpu_found(): dev_str = "cuda:0" if FRAMEWORK.get_name() == "pytorch" else "gpu:0" else: dev_str = "cpu" diff --git a/tests/platform_utils.py b/tests/platform_utils.py index a7c8c31..e0b4498 100644 --- a/tests/platform_utils.py +++ b/tests/platform_utils.py @@ -1,5 +1,5 @@ -# Copyright 2024 IBM Inc. All rights reserved # SPDX-License-Identifier: Apache-2.0 +# Copyright 2024 IBM Inc. All rights reserved """Utilities for platform detection and conditional test execution.""" @@ -7,15 +7,16 @@ def is_rocm_platform(): - """Detect if running on ROCm/AMD platform.""" + """Detect if running on ROCm/AMD platform. + + Uses the C++ extension's is_hip_found() to avoid framework-specific calls. + """ try: - import torch - if torch.cuda.is_available(): - if hasattr(torch.version, 'hip') and torch.version.hip is not None: - return True + from fastsafetensors import cpp as fstcpp + + return fstcpp.is_hip_found() except: - pass - return False + return False def is_cuda_platform(): @@ -25,26 +26,28 @@ def is_cuda_platform(): # List of tests that are expected to fail on ROCm (based on TEST_RESULTS.md) ROCM_EXPECTED_FAILURES = { - 'test_GdsFileCopier', # GDS not available on AMD + "test_GdsFileCopier", # GDS not available on AMD } # List of tests with memory leak detection issues on ROCm (non-critical) ROCM_MEMORY_LEAK_TESTS = { - 'test_SafeTensorsFileLoader', - 'test_SafeTensorsFileLoaderNoGds', - 'test_fastsafe_open', - 'test_int8', - 'test_float8_e5m2', - 'test_float8_e4m3fn', - 'test_float8_e4m3fn_to_int8', - 'test_cpp_metrics', + "test_SafeTensorsFileLoader", + "test_SafeTensorsFileLoaderNoGds", + "test_fastsafe_open", + "test_int8", + "test_float8_e5m2", + "test_float8_e4m3fn", + "test_float8_e4m3fn_to_int8", + "test_cpp_metrics", } def skip_if_rocm_expected_failure(test_name): """Skip test if it's an expected failure on ROCm.""" if is_rocm_platform() and test_name in ROCM_EXPECTED_FAILURES: - pytest.skip(f"Test '{test_name}' is expected to fail on ROCm (GDS not supported)") + pytest.skip( + f"Test '{test_name}' is expected to fail on ROCm (GDS not supported)" + ) def xfail_if_rocm_memory_leak(test_name): @@ -52,29 +55,57 @@ def xfail_if_rocm_memory_leak(test_name): if is_rocm_platform() and test_name in ROCM_MEMORY_LEAK_TESTS: return pytest.mark.xfail( reason=f"Test '{test_name}' has memory leak detection issues on ROCm (non-critical)", - strict=False + strict=False, ) return lambda func: func def get_platform_info(): - """Get platform information for debugging.""" + """Get platform information for debugging. + + Uses framework's get_cuda_ver() to avoid direct torch calls where possible. 
+ """ info = { - 'is_rocm': is_rocm_platform(), - 'is_cuda': is_cuda_platform(), + "is_rocm": is_rocm_platform(), + "is_cuda": is_cuda_platform(), } try: - import torch - if torch.cuda.is_available(): - info['torch_version'] = torch.__version__ - if is_rocm_platform(): - info['hip_version'] = torch.version.hip - info['rocm_version'] = torch.version.hip - else: - info['cuda_version'] = torch.version.cuda - info['device_count'] = torch.cuda.device_count() - info['device_name'] = torch.cuda.get_device_name(0) if torch.cuda.device_count() > 0 else None + from fastsafetensors import cpp as fstcpp + from fastsafetensors.common import is_gpu_found + + if is_gpu_found(): + # Get version info from framework + try: + from fastsafetensors.frameworks import get_framework_op + + framework = get_framework_op("pytorch") + gpu_ver = framework.get_cuda_ver() + info["gpu_version"] = gpu_ver + + # Parse the version to get specific info + if gpu_ver.startswith("hip-"): + info["hip_version"] = gpu_ver[4:] # Remove 'hip-' prefix + info["rocm_version"] = gpu_ver[4:] + elif gpu_ver.startswith("cuda-"): + info["cuda_version"] = gpu_ver[5:] # Remove 'cuda-' prefix + except: + pass + + # Get device count and name (still needs torch for this) + try: + import torch + + if torch.cuda.is_available(): + info["torch_version"] = torch.__version__ + info["device_count"] = torch.cuda.device_count() + info["device_name"] = ( + torch.cuda.get_device_name(0) + if torch.cuda.device_count() > 0 + else None + ) + except: + pass except: pass diff --git a/tests/test_fastsafetensors.py b/tests/test_fastsafetensors.py index 1606571..118e2ca 100644 --- a/tests/test_fastsafetensors.py +++ b/tests/test_fastsafetensors.py @@ -11,7 +11,7 @@ from fastsafetensors import SafeTensorsFileLoader, SafeTensorsMetadata, SingleGroup from fastsafetensors import cpp as fstcpp from fastsafetensors import fastsafe_open -from fastsafetensors.common import get_device_numa_node +from fastsafetensors.common import get_device_numa_node, is_gpu_found from fastsafetensors.copier.gds import GdsFileCopier from fastsafetensors.copier.nogds import NoGdsFileCopier from fastsafetensors.dlpack import from_cuda_buffer @@ -63,7 +63,7 @@ def save_safetensors_file( def get_and_check_device(framework: FrameworkOpBase): - dev_is_gpu = fstcpp.is_cuda_found() + dev_is_gpu = is_gpu_found() device = "cpu" if dev_is_gpu: if framework.get_name() == "pytorch": @@ -110,18 +110,29 @@ def test_framework(fstcpp_log, framework) -> None: framework.is_equal(t, [float(0.0)]) with pytest.raises(Exception): framework.get_process_group(int(0)) + # Test that get_cuda_ver() returns a string with platform prefix + cuda_ver = framework.get_cuda_ver() + assert isinstance(cuda_ver, str) + # Should be "hip-X.Y.Z", "cuda-X.Y", or "none" + assert ( + cuda_ver.startswith("hip-") + or cuda_ver.startswith("cuda-") + or cuda_ver == "none" + ) + + # Verify it matches what torch reports if framework.get_name() == "pytorch": import torch - cuda_ver = str(torch.version.cuda) if torch.cuda.is_available() else "0.0" - elif framework.get_name() == "paddle": - import paddle - - if paddle.device.is_compiled_with_cuda(): - cuda_ver = str(paddle.version.cuda()) + if torch.cuda.is_available(): + if hasattr(torch.version, "hip") and torch.version.hip: + assert cuda_ver.startswith("hip-") + assert str(torch.version.hip) in cuda_ver + else: + assert cuda_ver.startswith("cuda-") + assert str(torch.version.cuda) in cuda_ver else: - cuda_ver = "0.0" - assert framework.get_cuda_ver() == cuda_ver + assert cuda_ver == 
"none" def test_get_framework_fail(fstcpp_log) -> None: @@ -233,10 +244,10 @@ def test_close_gds(fstcpp_log) -> None: def test_get_device_pci_bus(fstcpp_log) -> None: bus = fstcpp.get_device_pci_bus(0) - if not fstcpp.is_cuda_found(): + if not is_gpu_found(): assert bus == "" else: - print(f"bus for cuda:0: {bus}") + print(f"bus for gpu:0: {bus}") assert len(bus) > 0 diff --git a/tests/test_multi.py b/tests/test_multi.py index b80b2f9..12b95cf 100644 --- a/tests/test_multi.py +++ b/tests/test_multi.py @@ -5,6 +5,7 @@ from fastsafetensors import SafeTensorsFileLoader from fastsafetensors import cpp as fstcpp +from fastsafetensors.common import is_gpu_found def test_shuffle(fstcpp_log, input_files, pg, framework): @@ -14,13 +15,13 @@ def test_shuffle(fstcpp_log, input_files, pg, framework): rank = pg.rank() world_size = pg.size() - device = "cuda:0" if fstcpp.is_cuda_found() else "cpu" + device = "cuda:0" if is_gpu_found() else "cpu" elif framework.get_name() == "paddle": from safetensors.paddle import load_file rank = pg.process_group.rank() world_size = pg.process_group.size() - device = "gpu:0" if fstcpp.is_cuda_found() else "cpu" + device = "gpu:0" if is_gpu_found() else "cpu" else: raise Exception(f"Unknown framework: {framework.get_name()}") loader = SafeTensorsFileLoader( From f7e617d4d5747e3dc8b92bb8f63fb268d6405e58 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 14:08:55 +0000 Subject: [PATCH 06/48] remove torch dependencies Signed-off-by: tjtanaa --- setup.py | 95 +++++++++++++++++++++++++++++++---------------- tests/conftest.py | 3 +- 2 files changed, 63 insertions(+), 35 deletions(-) diff --git a/setup.py b/setup.py index dbc7e6e..b513c58 100644 --- a/setup.py +++ b/setup.py @@ -4,6 +4,7 @@ import os import re import shutil +import subprocess from pathlib import Path from setuptools import Extension, setup @@ -74,7 +75,7 @@ def detect_platform(): def hipify_source_files(rocm_path): """ - Automatically hipify CUDA source files to HIP using torch.utils.hipify. + Automatically hipify CUDA source files to HIP using hipify-perl from ROCm. The cuda_compat.h header handles what hipify doesn't convert. Args: @@ -83,46 +84,74 @@ def hipify_source_files(rocm_path): Returns: list: Paths to hipified source files """ - from torch.utils.hipify.hipify_python import hipify - cpp_dir = Path("fastsafetensors/cpp").resolve() + hip_dir = cpp_dir / "hip" - # Prepare source files for hipification - extra_files = [ - str(cpp_dir / "ext.cpp"), - str(cpp_dir / "ext.hpp"), - ] + # Create hip/ subdirectory if it doesn't exist + hip_dir.mkdir(exist_ok=True) + + # Find hipify-perl in ROCm installation + hipify_perl = os.path.join(rocm_path, "bin", "hipify-perl") + if not os.path.exists(hipify_perl): + raise RuntimeError( + f"hipify-perl not found at {hipify_perl}. 
" + f"Please ensure ROCm is properly installed at {rocm_path}" + ) - print(f"Hipifying files using torch.utils.hipify:") - for f in extra_files: - print(f" - {f}") - - # Use torch's hipify - similar to vLLM's approach - hipify_result = hipify( - project_directory=str(cpp_dir.parent), - output_directory=str(cpp_dir), - header_include_dirs=[], - includes=[f"{cpp_dir}/*"], - extra_files=extra_files, - show_detailed=False, - is_pytorch_extension=False, - hipify_extra_files_only=True, - ) + # Files to hipify + source_files = [ + ("ext.cpp", "ext.cpp"), + ("ext.hpp", "ext.hpp"), + ] + print(f"Hipifying files using hipify-perl from {hipify_perl}:") hipified_files = [] - for source_path, result in hipify_result.items(): - if hasattr(result, "hipified_path") and result.hipified_path: - print(f"Successfully hipified: {source_path} -> {result.hipified_path}") - hipified_files.append(result.hipified_path) + + for src_name, dst_name in source_files: + src_path = cpp_dir / src_name + dst_path = hip_dir / dst_name + + print(f" - {src_path} -> {dst_path}") + + try: + # Run hipify-perl: hipify-perl input.cpp -o output.cpp + result = subprocess.run( + [hipify_perl, str(src_path), "-o", str(dst_path)], + check=True, + capture_output=True, + text=True, + ) + print(f" Successfully hipified: {src_name}") + hipified_files.append(str(dst_path)) + + # Print any warnings from hipify-perl + if result.stderr: + print(f" hipify-perl output: {result.stderr.strip()}") + + # Post-process: Replace cuda_compat.h with hip_compat.h + # hipify-perl doesn't convert custom header names + with open(dst_path, "r") as f: + content = f.read() + content = content.replace( + '#include "cuda_compat.h"', '#include "hip_compat.h"' + ) + with open(dst_path, "w") as f: + f.write(content) + print(f" Post-processed: cuda_compat.h -> hip_compat.h") + + except subprocess.CalledProcessError as e: + raise RuntimeError( + f"Failed to hipify {src_path}:\n" + f"stdout: {e.stdout}\n" + f"stderr: {e.stderr}" + ) from e # Copy cuda_compat.h to hip directory as hip_compat.h # (hipify converts the include statement from cuda_compat.h to hip_compat.h) - hip_dir = cpp_dir / "hip" - if hip_dir.exists(): - cuda_compat = cpp_dir / "cuda_compat.h" - hip_compat = hip_dir / "hip_compat.h" - shutil.copy2(cuda_compat, hip_compat) - print(f"Copied {cuda_compat} -> {hip_compat}") + cuda_compat = cpp_dir / "cuda_compat.h" + hip_compat = hip_dir / "hip_compat.h" + shutil.copy2(cuda_compat, hip_compat) + print(f"Copied {cuda_compat} -> {hip_compat}") return hipified_files diff --git a/tests/conftest.py b/tests/conftest.py index ba054d0..af4d27f 100644 --- a/tests/conftest.py +++ b/tests/conftest.py @@ -13,8 +13,7 @@ # Add tests directory to path to import platform_utils TESTS_DIR = os.path.dirname(__file__) -sys.path.insert(0, TESTS_DIR) -from platform_utils import get_platform_info, is_rocm_platform +from platform_utils import get_platform_info REPO_ROOT = os.path.dirname(os.path.dirname(TESTS_DIR)) DATA_DIR = os.path.join(REPO_ROOT, ".testdata") From 72eb7854a076e558c49c8e6fb7e3d575f4ff7895 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 19:12:37 +0000 Subject: [PATCH 07/48] handle when cuda and rocm not found Signed-off-by: tjtanaa --- fastsafetensors/copier/gds.py | 28 ++++++++++++++++++++-------- fastsafetensors/cpp/cuda_compat.h | 2 -- 2 files changed, 20 insertions(+), 10 deletions(-) diff --git a/fastsafetensors/copier/gds.py b/fastsafetensors/copier/gds.py index 5f2ec3a..dc24f1f 100644 --- a/fastsafetensors/copier/gds.py +++ 
b/fastsafetensors/copier/gds.py @@ -28,15 +28,27 @@ def __init__( self.copy_reqs: Dict[int, int] = {} self.aligned_length = 0 cuda_ver = framework.get_cuda_ver() - if cuda_ver and cuda_ver != "None": - cudavers = list(map(int, cuda_ver.split("."))) - # CUDA 12.2 (GDS version 1.7) introduces support for non O_DIRECT file descriptors - # Compatible with CUDA 11.x - self.o_direct = not ( - cudavers[0] > 12 or (cudavers[0] == 12 and cudavers[1] >= 2) - ) + if cuda_ver and cuda_ver != "none": + # Parse version string (e.g., "cuda-12.1" or "hip-5.7.0") + # Extract the numeric part after the platform prefix + ver_parts = cuda_ver.split("-", 1) + if len(ver_parts) == 2: + cudavers = list(map(int, ver_parts[1].split("."))) + # CUDA 12.2 (GDS version 1.7) introduces support for non O_DIRECT file descriptors + # Compatible with CUDA 11.x + # Only applies to CUDA platform (not ROCm/HIP) + if ver_parts[0] == "cuda": + self.o_direct = not ( + cudavers[0] > 12 or (cudavers[0] == 12 and cudavers[1] >= 2) + ) + else: + # ROCm/HIP platform, use O_DIRECT + self.o_direct = True + else: + # Fallback if format is unexpected + self.o_direct = True else: - # ROCm or non-CUDA platform, use O_DIRECT + # No GPU platform detected, use O_DIRECT self.o_direct = True def set_o_direct(self, enable: bool): diff --git a/fastsafetensors/cpp/cuda_compat.h b/fastsafetensors/cpp/cuda_compat.h index f430ec3..021e7f4 100644 --- a/fastsafetensors/cpp/cuda_compat.h +++ b/fastsafetensors/cpp/cuda_compat.h @@ -1,7 +1,5 @@ // SPDX-License-Identifier: Apache-2.0 /* - * Copyright 2024 IBM Inc. All rights reserved - * * CUDA/HIP compatibility layer for fastsafetensors * Minimal compatibility header - only defines what hipify-perl doesn't handle */ From 6ddba67ea8e0e6a19392495f6e4905e0e35683d6 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 19:23:15 +0000 Subject: [PATCH 08/48] fix paddle paddle Signed-off-by: tjtanaa --- fastsafetensors/frameworks/_paddle.py | 17 ++++++++++++----- 1 file changed, 12 insertions(+), 5 deletions(-) diff --git a/fastsafetensors/frameworks/_paddle.py b/fastsafetensors/frameworks/_paddle.py index 13f5eec..7592d31 100644 --- a/fastsafetensors/frameworks/_paddle.py +++ b/fastsafetensors/frameworks/_paddle.py @@ -214,11 +214,18 @@ def copy_tensor(self, dst: PaddleTensor, src: PaddleTensor) -> None: dst.device = src.device def get_cuda_ver(self) -> str: - return ( - str(paddle.version.cuda()) - if paddle.device.is_compiled_with_cuda() - else "0.0" - ) + """Get GPU runtime version with platform indicator. + + Returns a string like 'hip-5.7.0' for ROCm or 'cuda-12.1' for CUDA, + or 'none' if no GPU is available. This allows code to distinguish + between different GPU platforms without using paddle directly. 
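As a minimal illustrative sketch (not part of this patch), callers can branch on the prefixed string returned by get_cuda_ver() the same way the GdsFileCopier change above does; the helper name needs_o_direct and the version numbers below are made up for illustration:

    # Editor's sketch only: mirrors the O_DIRECT rule from copier/gds.py above.
    def needs_o_direct(ver: str) -> bool:
        if not ver or ver == "none":
            return True  # no GPU runtime detected: keep O_DIRECT
        platform, _, numbers = ver.partition("-")
        parts = numbers.split(".")
        major, minor = int(parts[0]), (int(parts[1]) if len(parts) > 1 else 0)
        if platform == "cuda":
            # CUDA 12.2 (GDS 1.7) and newer support non-O_DIRECT file descriptors
            return not (major > 12 or (major == 12 and minor >= 2))
        return True  # ROCm/HIP (and anything unknown) stays on O_DIRECT

    assert needs_o_direct("cuda-12.2") is False
    assert needs_o_direct("cuda-11.8") is True
    assert needs_o_direct("hip-6.2.4") is True
    assert needs_o_direct("none") is True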
+ """ + if paddle.device.is_compiled_with_cuda(): + # Check if this is ROCm/HIP build + if paddle.device.is_compiled_with_rocm(): + return f"hip-{paddle.version.cuda()}" + return f"cuda-{paddle.version.cuda()}" + return "none" def get_device_ptr_align(self) -> int: CUDA_PTR_ALIGN: int = 16 From 8714185372b2c7cfbacb48d7903581a185eadcc3 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 19:40:32 +0000 Subject: [PATCH 09/48] setup rocm wheel ci build Signed-off-by: tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 234 +++++++++++++++++++++++ 1 file changed, 234 insertions(+) create mode 100644 .github/workflows/build-rocm-wheels.yaml diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml new file mode 100644 index 0000000..3ff78b7 --- /dev/null +++ b/.github/workflows/build-rocm-wheels.yaml @@ -0,0 +1,234 @@ +name: Build ROCm wheels + +on: + workflow_dispatch: + push: + branches: [main] + paths: + - 'fastsafetensors/cpp/**' + - 'setup.py' + - '.github/workflows/build-rocm-wheels.yaml' + pull_request: + branches: [main] + paths: + - 'fastsafetensors/cpp/**' + - 'setup.py' + - '.github/workflows/build-rocm-wheels.yaml' + +permissions: + contents: read + +jobs: + build-rocm-wheels: + name: Build ROCm wheel - Python ${{ matrix.python-version }} + runs-on: ubuntu-latest + container: + image: rocm/dev-ubuntu-22.04:7.0 + options: --user root + strategy: + fail-fast: false + matrix: + python-version: ["3.9", "3.10", "3.11", "3.12", "3.13"] + + steps: + - name: Checkout code + uses: actions/checkout@v4 + + - name: Install system dependencies and hipify-perl + run: | + apt-get update + apt-get install -y \ + wget \ + build-essential \ + libnuma-dev \ + gcc \ + g++ \ + make \ + git \ + curl \ + ca-certificates \ + hipify-perl \ + libssl-dev \ + zlib1g-dev \ + libbz2-dev \ + libreadline-dev \ + libsqlite3-dev \ + libncursesw5-dev \ + xz-utils \ + tk-dev \ + libxml2-dev \ + libxmlsec1-dev \ + libffi-dev \ + liblzma-dev \ + software-properties-common + + # Verify hipify-perl is available + which hipify-perl || echo "Warning: hipify-perl not found" + + - name: Install Python ${{ matrix.python-version }} + run: | + # Install Python from deadsnakes PPA for Ubuntu 22.04 + add-apt-repository -y ppa:deadsnakes/ppa + apt-get update + + # Install specific Python version and dev packages + PY_VER="${{ matrix.python-version }}" + apt-get install -y \ + python${PY_VER} \ + python${PY_VER}-dev \ + python${PY_VER}-distutils || true + + # Install pip for this Python version + curl -sS https://bootstrap.pypa.io/get-pip.py | python${PY_VER} + + # Create symlink for easier access + update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PY_VER} 1 + update-alternatives --set python3 /usr/bin/python${PY_VER} + + # Verify installation + python3 --version + python3 -m pip --version + + - name: Install Python build dependencies + run: | + python3 -m pip install --upgrade pip setuptools wheel + python3 -m pip install build setuptools_scm pybind11 numpy + + - name: Set ROCm environment variables + run: | + echo "ROCM_PATH=/opt/rocm" >> $GITHUB_ENV + echo "HIP_PATH=/opt/rocm/hip" >> $GITHUB_ENV + echo "/opt/rocm/bin" >> $GITHUB_PATH + echo "/opt/rocm/hip/bin" >> $GITHUB_PATH + + # Verify ROCm installation + ls -la /opt/rocm/ || echo "Warning: /opt/rocm not found" + hipify-perl --version || echo "Warning: hipify-perl not working" + + - name: Build wheel for ROCm + run: | + # The setup.py should detect ROCm and use hipify-perl automatically + python3 -m pip 
wheel . -w wheelhouse/ --no-deps -v + env: + ROCM_PATH: /opt/rocm + HIP_PATH: /opt/rocm/hip + + - name: List built wheels + run: | + ls -lah wheelhouse/ + + - name: Rename wheel to include rocm tag + run: | + cd wheelhouse + for wheel in *.whl; do + if [ -f "$wheel" ]; then + # Rename to include rocm tag before platform + # e.g., fastsafetensors-X.Y.Z-cp39-cp39-linux_x86_64.whl + # becomes fastsafetensors-X.Y.Z-cp39-cp39-rocm_linux_x86_64.whl + NEW_NAME=$(echo "$wheel" | sed "s/-linux_/-rocm_linux_/") + + if [ "$wheel" != "$NEW_NAME" ]; then + mv "$wheel" "$NEW_NAME" + echo "Renamed: $wheel -> $NEW_NAME" + fi + fi + done + ls -lah + + - name: Upload wheel artifact + uses: actions/upload-artifact@v4 + with: + name: rocm-wheel-py${{ matrix.python-version }} + path: wheelhouse/*.whl + if-no-files-found: error + + test-rocm-wheels: + name: Test ROCm wheel - Python ${{ matrix.python-version }} + needs: build-rocm-wheels + runs-on: ubuntu-latest + container: + image: rocm/dev-ubuntu-22.04:7.0 + options: --user root + strategy: + fail-fast: false + matrix: + python-version: ["3.9", "3.10", "3.11", "3.12", "3.13"] + + steps: + - name: Checkout code + uses: actions/checkout@v4 + + - name: Install Python ${{ matrix.python-version }} + run: | + apt-get update + apt-get install -y software-properties-common + add-apt-repository -y ppa:deadsnakes/ppa + apt-get update + + PY_VER="${{ matrix.python-version }}" + apt-get install -y \ + python${PY_VER} \ + python${PY_VER}-dev \ + python${PY_VER}-distutils || true + + curl -sS https://bootstrap.pypa.io/get-pip.py | python${PY_VER} + update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PY_VER} 1 + update-alternatives --set python3 /usr/bin/python${PY_VER} + + python3 --version + + - name: Download wheel + uses: actions/download-artifact@v4 + with: + name: rocm-wheel-py${{ matrix.python-version }} + path: wheelhouse/ + + - name: Install wheel and test dependencies + run: | + python3 -m pip install --upgrade pip + python3 -m pip install wheelhouse/*.whl + + # Install test dependencies + python3 -m pip install pytest safetensors transformers numpy + + # Install PyTorch with ROCm support for testing + python3 -m pip install torch --index-url https://download.pytorch.org/whl/rocm6.2 || \ + python3 -m pip install torch --index-url https://download.pytorch.org/whl/cpu + + - name: Run basic import test + run: | + python3 -c "import fastsafetensors; print('Import successful')" + python3 -c "from fastsafetensors import SafeTensorsFileLoader; print('SafeTensorsFileLoader imported')" + python3 -c "from fastsafetensors.frameworks import get_framework_op; fw = get_framework_op('pytorch'); print(f'PyTorch framework: {fw.get_name()}')" + python3 -c "from fastsafetensors.frameworks import get_framework_op; fw = get_framework_op('pytorch'); ver = fw.get_cuda_ver(); print(f'CUDA/ROCm version: {ver}')" + + - name: Run basic tests + run: | + cd tests + export TEST_FASTSAFETENSORS_FRAMEWORK=pytorch + python3 -m pytest -xvs test_fastsafetensors.py::test_device + python3 -m pytest -xvs test_fastsafetensors.py::test_framework + + collect-wheels: + name: Collect all ROCm wheels + needs: test-rocm-wheels + runs-on: ubuntu-latest + + steps: + - name: Download all wheel artifacts + uses: actions/download-artifact@v4 + with: + path: all-wheels/ + pattern: rocm-wheel-* + merge-multiple: true + + - name: List all wheels + run: | + echo "Built ROCm wheels:" + ls -lah all-wheels/ + + - name: Upload combined artifact + uses: actions/upload-artifact@v4 + with: + name: 
rocm-wheels-all + path: all-wheels/*.whl From 5fb3a142f97e56f73c3770a6178bcc1b736d8d49 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 19:42:06 +0000 Subject: [PATCH 10/48] manual trigger rocm workflow Signed-off-by: tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 12 ------------ 1 file changed, 12 deletions(-) diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml index 3ff78b7..5703d48 100644 --- a/.github/workflows/build-rocm-wheels.yaml +++ b/.github/workflows/build-rocm-wheels.yaml @@ -2,18 +2,6 @@ name: Build ROCm wheels on: workflow_dispatch: - push: - branches: [main] - paths: - - 'fastsafetensors/cpp/**' - - 'setup.py' - - '.github/workflows/build-rocm-wheels.yaml' - pull_request: - branches: [main] - paths: - - 'fastsafetensors/cpp/**' - - 'setup.py' - - '.github/workflows/build-rocm-wheels.yaml' permissions: contents: read From 5e2e4afa76df18d7a4fe8231b8771cf70afa44fe Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 19:49:37 +0000 Subject: [PATCH 11/48] remove system package steps Signed-off-by: tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 34 ------------------------ 1 file changed, 34 deletions(-) diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml index 5703d48..fff2f56 100644 --- a/.github/workflows/build-rocm-wheels.yaml +++ b/.github/workflows/build-rocm-wheels.yaml @@ -3,9 +3,6 @@ name: Build ROCm wheels on: workflow_dispatch: -permissions: - contents: read - jobs: build-rocm-wheels: name: Build ROCm wheel - Python ${{ matrix.python-version }} @@ -22,37 +19,6 @@ jobs: - name: Checkout code uses: actions/checkout@v4 - - name: Install system dependencies and hipify-perl - run: | - apt-get update - apt-get install -y \ - wget \ - build-essential \ - libnuma-dev \ - gcc \ - g++ \ - make \ - git \ - curl \ - ca-certificates \ - hipify-perl \ - libssl-dev \ - zlib1g-dev \ - libbz2-dev \ - libreadline-dev \ - libsqlite3-dev \ - libncursesw5-dev \ - xz-utils \ - tk-dev \ - libxml2-dev \ - libxmlsec1-dev \ - libffi-dev \ - liblzma-dev \ - software-properties-common - - # Verify hipify-perl is available - which hipify-perl || echo "Warning: hipify-perl not found" - - name: Install Python ${{ matrix.python-version }} run: | # Install Python from deadsnakes PPA for Ubuntu 22.04 From 75530b5d28b636ec55ac08889e5e4ae098eddb22 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 19:55:22 +0000 Subject: [PATCH 12/48] install system dependencies Signed-off-by: tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 15 +++++++++++++++ 1 file changed, 15 insertions(+) diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml index fff2f56..94d5a99 100644 --- a/.github/workflows/build-rocm-wheels.yaml +++ b/.github/workflows/build-rocm-wheels.yaml @@ -19,6 +19,21 @@ jobs: - name: Checkout code uses: actions/checkout@v4 + - name: Install system dependencies + run: | + apt-get update + apt-get install -y \ + software-properties-common \ + wget \ + build-essential \ + libnuma-dev \ + gcc \ + g++ \ + make \ + git \ + curl \ + ca-certificates + - name: Install Python ${{ matrix.python-version }} run: | # Install Python from deadsnakes PPA for Ubuntu 22.04 From 6ad6bb2dd7597666be8cd73a3eef7be2a72e8baf Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 20:04:51 +0000 Subject: [PATCH 13/48] upgrade ubuntu version, skip tests Signed-off-by: tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 77 
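Since this patch drops the wheel test job from CI, the same import checks can still be run by hand against an installed wheel; a minimal sketch, assuming the pytorch extra is installed in the environment:

    # Local smoke test, equivalent to the inline "python3 -c" checks removed from CI.
    from fastsafetensors import SafeTensorsFileLoader  # noqa: F401  (import check only)
    from fastsafetensors.frameworks import get_framework_op

    fw = get_framework_op("pytorch")
    print(f"framework: {fw.get_name()}")
    print(f"GPU runtime: {fw.get_cuda_ver()}")  # e.g. "hip-...", "cuda-...", or "none"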
+++--------------------- 1 file changed, 9 insertions(+), 68 deletions(-) diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml index 94d5a99..ad043b8 100644 --- a/.github/workflows/build-rocm-wheels.yaml +++ b/.github/workflows/build-rocm-wheels.yaml @@ -21,6 +21,10 @@ jobs: - name: Install system dependencies run: | + # Prevent interactive prompts during package installation + export DEBIAN_FRONTEND=noninteractive + export TZ=Etc/UTC + apt-get update apt-get install -y \ software-properties-common \ @@ -36,6 +40,10 @@ jobs: - name: Install Python ${{ matrix.python-version }} run: | + # Prevent interactive prompts during package installation + export DEBIAN_FRONTEND=noninteractive + export TZ=Etc/UTC + # Install Python from deadsnakes PPA for Ubuntu 22.04 add-apt-repository -y ppa:deadsnakes/ppa apt-get update @@ -111,76 +119,9 @@ jobs: path: wheelhouse/*.whl if-no-files-found: error - test-rocm-wheels: - name: Test ROCm wheel - Python ${{ matrix.python-version }} - needs: build-rocm-wheels - runs-on: ubuntu-latest - container: - image: rocm/dev-ubuntu-22.04:7.0 - options: --user root - strategy: - fail-fast: false - matrix: - python-version: ["3.9", "3.10", "3.11", "3.12", "3.13"] - - steps: - - name: Checkout code - uses: actions/checkout@v4 - - - name: Install Python ${{ matrix.python-version }} - run: | - apt-get update - apt-get install -y software-properties-common - add-apt-repository -y ppa:deadsnakes/ppa - apt-get update - - PY_VER="${{ matrix.python-version }}" - apt-get install -y \ - python${PY_VER} \ - python${PY_VER}-dev \ - python${PY_VER}-distutils || true - - curl -sS https://bootstrap.pypa.io/get-pip.py | python${PY_VER} - update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PY_VER} 1 - update-alternatives --set python3 /usr/bin/python${PY_VER} - - python3 --version - - - name: Download wheel - uses: actions/download-artifact@v4 - with: - name: rocm-wheel-py${{ matrix.python-version }} - path: wheelhouse/ - - - name: Install wheel and test dependencies - run: | - python3 -m pip install --upgrade pip - python3 -m pip install wheelhouse/*.whl - - # Install test dependencies - python3 -m pip install pytest safetensors transformers numpy - - # Install PyTorch with ROCm support for testing - python3 -m pip install torch --index-url https://download.pytorch.org/whl/rocm6.2 || \ - python3 -m pip install torch --index-url https://download.pytorch.org/whl/cpu - - - name: Run basic import test - run: | - python3 -c "import fastsafetensors; print('Import successful')" - python3 -c "from fastsafetensors import SafeTensorsFileLoader; print('SafeTensorsFileLoader imported')" - python3 -c "from fastsafetensors.frameworks import get_framework_op; fw = get_framework_op('pytorch'); print(f'PyTorch framework: {fw.get_name()}')" - python3 -c "from fastsafetensors.frameworks import get_framework_op; fw = get_framework_op('pytorch'); ver = fw.get_cuda_ver(); print(f'CUDA/ROCm version: {ver}')" - - - name: Run basic tests - run: | - cd tests - export TEST_FASTSAFETENSORS_FRAMEWORK=pytorch - python3 -m pytest -xvs test_fastsafetensors.py::test_device - python3 -m pytest -xvs test_fastsafetensors.py::test_framework - collect-wheels: name: Collect all ROCm wheels - needs: test-rocm-wheels + needs: build-rocm-wheels runs-on: ubuntu-latest steps: From ab00395e20afc52170631f119a6724ea514a8b3e Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 20:07:24 +0000 Subject: [PATCH 14/48] upgrade ubuntu version, skip tests Signed-off-by: 
tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml index ad043b8..54865c9 100644 --- a/.github/workflows/build-rocm-wheels.yaml +++ b/.github/workflows/build-rocm-wheels.yaml @@ -8,7 +8,7 @@ jobs: name: Build ROCm wheel - Python ${{ matrix.python-version }} runs-on: ubuntu-latest container: - image: rocm/dev-ubuntu-22.04:7.0 + image: rocm/dev-ubuntu-24.04:7.0 options: --user root strategy: fail-fast: false @@ -44,7 +44,7 @@ jobs: export DEBIAN_FRONTEND=noninteractive export TZ=Etc/UTC - # Install Python from deadsnakes PPA for Ubuntu 22.04 + # Install Python from deadsnakes PPA for Ubuntu 24.04 add-apt-repository -y ppa:deadsnakes/ppa apt-get update From 9a11ce3f38d8616b1c2955c9fdff197a4e4b0c94 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 20:55:46 +0000 Subject: [PATCH 15/48] install from python from offical source Signed-off-by: tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 53 +++++++++++++++++++----- 1 file changed, 42 insertions(+), 11 deletions(-) diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml index 54865c9..f50a814 100644 --- a/.github/workflows/build-rocm-wheels.yaml +++ b/.github/workflows/build-rocm-wheels.yaml @@ -44,23 +44,54 @@ jobs: export DEBIAN_FRONTEND=noninteractive export TZ=Etc/UTC - # Install Python from deadsnakes PPA for Ubuntu 24.04 - add-apt-repository -y ppa:deadsnakes/ppa - apt-get update - - # Install specific Python version and dev packages PY_VER="${{ matrix.python-version }}" - apt-get install -y \ - python${PY_VER} \ - python${PY_VER}-dev \ - python${PY_VER}-distutils || true + + # Try to install from Ubuntu's official repositories first + apt-get update + if apt-cache show python${PY_VER} 2>/dev/null; then + echo "Installing Python ${PY_VER} from Ubuntu repositories" + apt-get install -y \ + python${PY_VER} \ + python${PY_VER}-dev \ + python${PY_VER}-venv + else + # If not available in Ubuntu repos, install using pyenv + echo "Python ${PY_VER} not in Ubuntu repos, installing via pyenv from python.org" + + # Install pyenv dependencies + apt-get install -y \ + libssl-dev \ + zlib1g-dev \ + libbz2-dev \ + libreadline-dev \ + libsqlite3-dev \ + libncursesw5-dev \ + xz-utils \ + tk-dev \ + libxml2-dev \ + libxmlsec1-dev \ + libffi-dev \ + liblzma-dev + + # Install pyenv + export PYENV_ROOT="/root/.pyenv" + curl https://pyenv.run | bash + export PATH="$PYENV_ROOT/bin:$PATH" + eval "$(pyenv init -)" + + # Install Python from official python.org releases + pyenv install ${PY_VER} + pyenv global ${PY_VER} + fi # Install pip for this Python version curl -sS https://bootstrap.pypa.io/get-pip.py | python${PY_VER} # Create symlink for easier access - update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PY_VER} 1 - update-alternatives --set python3 /usr/bin/python${PY_VER} + update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PY_VER} 1 || \ + ln -sf $(which python${PY_VER}) /usr/bin/python3 + + update-alternatives --set python3 /usr/bin/python${PY_VER} 2>/dev/null || true # Verify installation python3 --version From d6c1f4ac73dec215b24e4093ef0eab0fd61c5f5b Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 21:02:25 +0000 Subject: [PATCH 16/48] use venv instead Signed-off-by: tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 35 ++++++++++++++---------- 1 file changed, 21 insertions(+), 14 
deletions(-) diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml index f50a814..67db243 100644 --- a/.github/workflows/build-rocm-wheels.yaml +++ b/.github/workflows/build-rocm-wheels.yaml @@ -84,23 +84,26 @@ jobs: pyenv global ${PY_VER} fi - # Install pip for this Python version - curl -sS https://bootstrap.pypa.io/get-pip.py | python${PY_VER} + # Verify installation + python${PY_VER} --version - # Create symlink for easier access - update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PY_VER} 1 || \ - ln -sf $(which python${PY_VER}) /usr/bin/python3 + - name: Create virtual environment and install build dependencies + run: | + PY_VER="${{ matrix.python-version }}" - update-alternatives --set python3 /usr/bin/python${PY_VER} 2>/dev/null || true + # Create virtual environment + python${PY_VER} -m venv /opt/venv - # Verify installation - python3 --version - python3 -m pip --version + # Activate venv and install dependencies + . /opt/venv/bin/activate - - name: Install Python build dependencies - run: | - python3 -m pip install --upgrade pip setuptools wheel - python3 -m pip install build setuptools_scm pybind11 numpy + # Upgrade pip and install build tools + python -m pip install --upgrade pip setuptools wheel + python -m pip install build setuptools_scm pybind11 numpy + + # Verify + python --version + pip --version - name: Set ROCm environment variables run: | @@ -108,6 +111,7 @@ jobs: echo "HIP_PATH=/opt/rocm/hip" >> $GITHUB_ENV echo "/opt/rocm/bin" >> $GITHUB_PATH echo "/opt/rocm/hip/bin" >> $GITHUB_PATH + echo "/opt/venv/bin" >> $GITHUB_PATH # Verify ROCm installation ls -la /opt/rocm/ || echo "Warning: /opt/rocm not found" @@ -115,8 +119,11 @@ jobs: - name: Build wheel for ROCm run: | + # Activate venv + . /opt/venv/bin/activate + # The setup.py should detect ROCm and use hipify-perl automatically - python3 -m pip wheel . -w wheelhouse/ --no-deps -v + python -m pip wheel . 
-w wheelhouse/ --no-deps -v env: ROCM_PATH: /opt/rocm HIP_PATH: /opt/rocm/hip From 5d243830d10e8d275722190139e877de9ff0e070 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 21:18:24 +0000 Subject: [PATCH 17/48] fix other python ci build Signed-off-by: tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 9 +++++++-- 1 file changed, 7 insertions(+), 2 deletions(-) diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml index 67db243..a3c85bd 100644 --- a/.github/workflows/build-rocm-wheels.yaml +++ b/.github/workflows/build-rocm-wheels.yaml @@ -46,9 +46,9 @@ jobs: PY_VER="${{ matrix.python-version }}" - # Try to install from Ubuntu's official repositories first + # Check if Python dev package is available in Ubuntu repos apt-get update - if apt-cache show python${PY_VER} 2>/dev/null; then + if apt-cache show python${PY_VER}-dev 2>/dev/null | grep -q "Package: python${PY_VER}-dev"; then echo "Installing Python ${PY_VER} from Ubuntu repositories" apt-get install -y \ python${PY_VER} \ @@ -82,6 +82,11 @@ jobs: # Install Python from official python.org releases pyenv install ${PY_VER} pyenv global ${PY_VER} + + # Create symlink so python${PY_VER} command works + INSTALLED_VERSION=$(ls /root/.pyenv/versions/ | grep "^${PY_VER}") + ln -sf /root/.pyenv/versions/${INSTALLED_VERSION}/bin/python /usr/local/bin/python${PY_VER} + echo "Created symlink: /usr/local/bin/python${PY_VER} -> /root/.pyenv/versions/${INSTALLED_VERSION}/bin/python" fi # Verify installation From 5eba4b5d15bc5fc3a86d8b46fcb81508999adcd7 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 22:13:33 +0000 Subject: [PATCH 18/48] build many linux Signed-off-by: tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 33 ++++++++++++++++++++---- 1 file changed, 28 insertions(+), 5 deletions(-) diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml index a3c85bd..a48ce87 100644 --- a/.github/workflows/build-rocm-wheels.yaml +++ b/.github/workflows/build-rocm-wheels.yaml @@ -104,7 +104,7 @@ jobs: # Upgrade pip and install build tools python -m pip install --upgrade pip setuptools wheel - python -m pip install build setuptools_scm pybind11 numpy + python -m pip install build setuptools_scm pybind11 numpy auditwheel # Verify python --version @@ -137,15 +137,38 @@ jobs: run: | ls -lah wheelhouse/ + - name: Repair wheel with auditwheel to create manylinux wheel + run: | + # Activate venv + . 
/opt/venv/bin/activate + + # Use auditwheel to repair and convert to manylinux wheel + mkdir -p wheelhouse_repaired + for wheel in wheelhouse/*.whl; do + echo "Repairing wheel: $wheel" + auditwheel repair "$wheel" -w wheelhouse_repaired/ || { + echo "auditwheel repair failed, copying original wheel" + cp "$wheel" wheelhouse_repaired/ + } + done + + # Replace original wheelhouse with repaired wheels + rm -rf wheelhouse + mv wheelhouse_repaired wheelhouse + + echo "Repaired wheels:" + ls -lah wheelhouse/ + - name: Rename wheel to include rocm tag run: | cd wheelhouse for wheel in *.whl; do if [ -f "$wheel" ]; then - # Rename to include rocm tag before platform - # e.g., fastsafetensors-X.Y.Z-cp39-cp39-linux_x86_64.whl - # becomes fastsafetensors-X.Y.Z-cp39-cp39-rocm_linux_x86_64.whl - NEW_NAME=$(echo "$wheel" | sed "s/-linux_/-rocm_linux_/") + # Rename to include rocm tag before manylinux/linux platform + # e.g., fastsafetensors-X.Y.Z-cp39-cp39-manylinux_2_27_x86_64.whl + # becomes fastsafetensors-X.Y.Z-cp39-cp39-rocm_manylinux_2_27_x86_64.whl + # Also handles: linux_x86_64 -> rocm_linux_x86_64 + NEW_NAME=$(echo "$wheel" | sed -E "s/-(manylinux|linux)_/-rocm_\1_/") if [ "$wheel" != "$NEW_NAME" ]; then mv "$wheel" "$NEW_NAME" From c543e162152f6d6763c233f2a184bdae9083993b Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 22:24:40 +0000 Subject: [PATCH 19/48] remove rocm_ tag from platform tag Signed-off-by: tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 19 ------------------- 1 file changed, 19 deletions(-) diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml index a48ce87..80e5ed4 100644 --- a/.github/workflows/build-rocm-wheels.yaml +++ b/.github/workflows/build-rocm-wheels.yaml @@ -159,25 +159,6 @@ jobs: echo "Repaired wheels:" ls -lah wheelhouse/ - - name: Rename wheel to include rocm tag - run: | - cd wheelhouse - for wheel in *.whl; do - if [ -f "$wheel" ]; then - # Rename to include rocm tag before manylinux/linux platform - # e.g., fastsafetensors-X.Y.Z-cp39-cp39-manylinux_2_27_x86_64.whl - # becomes fastsafetensors-X.Y.Z-cp39-cp39-rocm_manylinux_2_27_x86_64.whl - # Also handles: linux_x86_64 -> rocm_linux_x86_64 - NEW_NAME=$(echo "$wheel" | sed -E "s/-(manylinux|linux)_/-rocm_\1_/") - - if [ "$wheel" != "$NEW_NAME" ]; then - mv "$wheel" "$NEW_NAME" - echo "Renamed: $wheel -> $NEW_NAME" - fi - fi - done - ls -lah - - name: Upload wheel artifact uses: actions/upload-artifact@v4 with: From 8ea1956fdbfef0007c614b8396bbaedb671441dd Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 23:30:11 +0000 Subject: [PATCH 20/48] Add automated PyPI index with separate CUDA/ROCm backends - Add script to auto-generate PyPI-compatible index from GitHub releases - Create separate indexes for CUDA and ROCm wheels based on release tags - Add GitHub Actions workflow to deploy indexes to GitHub Pages - Generate landing page with installation instructions - Ignore auto-generated pypi-index directory Indexes will be available at: - ROCm: https://embeddedllm.github.io/fastsafetensors-rocm/rocm/simple/ - CUDA: https://embeddedllm.github.io/fastsafetensors-rocm/cuda/simple/ Signed-off-by: tjtanaa --- .github/scripts/generate_pypi_index.py | 228 +++++++++++++++++++++++ .github/workflows/deploy-pypi-index.yaml | 53 ++++++ .gitignore | 5 +- 3 files changed, 285 insertions(+), 1 deletion(-) create mode 100755 .github/scripts/generate_pypi_index.py create mode 100644 .github/workflows/deploy-pypi-index.yaml diff --git 
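A quick way to sanity-check the auditwheel step above is to inspect the platform tags of the wheels it produces; a sketch that assumes the packaging library is installed and that the wheels sit in wheelhouse/ as in the workflow:

    # After "auditwheel repair", the platform tag should be a manylinux_* tag
    # rather than plain linux_x86_64.
    from pathlib import Path
    from packaging.utils import parse_wheel_filename

    for whl in sorted(Path("wheelhouse").glob("*.whl")):
        name, version, _build, tags = parse_wheel_filename(whl.name)
        platforms = sorted({t.platform for t in tags})
        print(f"{whl.name}: {name} {version} -> {platforms}")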
a/.github/scripts/generate_pypi_index.py b/.github/scripts/generate_pypi_index.py new file mode 100755 index 0000000..eb360d9 --- /dev/null +++ b/.github/scripts/generate_pypi_index.py @@ -0,0 +1,228 @@ +#!/usr/bin/env python3 +""" +Generate PyPI-compatible simple index from GitHub releases. +This script fetches all releases and creates separate indexes for CUDA and ROCm wheels. +""" + +import json +import os +import sys +from pathlib import Path +from urllib.request import urlopen, Request + +def fetch_releases(repo_owner, repo_name): + """Fetch all releases from GitHub API.""" + url = f"https://api.github.com/repos/{repo_owner}/{repo_name}/releases" + headers = { + "Accept": "application/vnd.github.v3+json", + "User-Agent": "PyPI-Index-Generator" + } + + # Add GitHub token if available (for higher rate limits) + token = os.environ.get("GITHUB_TOKEN") + if token: + headers["Authorization"] = f"token {token}" + + request = Request(url, headers=headers) + + try: + with urlopen(request) as response: + return json.loads(response.read().decode()) + except Exception as e: + print(f"Error fetching releases: {e}", file=sys.stderr) + sys.exit(1) + +def categorize_backend(release_tag): + """Determine backend (cuda/rocm) from release tag.""" + tag_lower = release_tag.lower() + + if "rocm" in tag_lower: + return "rocm" + elif "cuda" in tag_lower: + return "cuda" + else: + # Default to cuda for untagged releases + return "cuda" + +def extract_wheels_by_backend(releases): + """Extract wheel files from releases, categorized by backend.""" + wheels_by_backend = { + "cuda": [], + "rocm": [] + } + + for release in releases: + backend = categorize_backend(release.get("tag_name", "")) + + for asset in release.get("assets", []): + name = asset.get("name", "") + if name.endswith(".whl"): + wheels_by_backend[backend].append({ + "name": name, + "url": asset.get("browser_download_url"), + "version": release.get("tag_name"), + }) + + return wheels_by_backend + +def generate_root_index(output_dir, packages): + """Generate the root simple index.""" + html = """ + + + + Simple Index + + +

+<h1>Simple Index</h1>
+"""
+
+    for package in sorted(packages):
+        html += f'    <a href="{package}/">{package}</a><br/>\n'
+
+    html += """</body>
+</html>
+"""
+
+    output_path = output_dir / "index.html"
+    output_path.write_text(html)
+    print(f"Generated: {output_path}")
+
+def generate_package_index(output_dir, package_name, wheels):
+    """Generate package-specific index with all wheels."""
+    html = f"""<!DOCTYPE html>
+<html>
+<head>
+<title>Links for {package_name}</title>
+</head>
+<body>
+<h1>Links for {package_name}</h1>
+"""
+
+    # Sort wheels by version and Python version
+    sorted_wheels = sorted(wheels, key=lambda w: (w["name"], w["version"]), reverse=True)
+
+    for wheel in sorted_wheels:
+        # Extract package name from wheel filename to ensure consistency
+        wheel_name = wheel["name"]
+        url = wheel["url"]
+        html += f'    <a href="{url}">{wheel_name}</a><br/>\n'
+
+    html += """</body>
+</html>
+"""
+
+    package_dir = output_dir / package_name
+    package_dir.mkdir(parents=True, exist_ok=True)
+
+    output_path = package_dir / "index.html"
+    output_path.write_text(html)
+    print(f"Generated: {output_path}")
+
+def generate_landing_page(base_dir, repo_name):
+    """Generate a landing page for the PyPI index."""
+    html = f"""<!DOCTYPE html>
+<html>
+<head>
+<title>{repo_name} - PyPI Index</title>
+</head>
+<body>
+<h1>{repo_name} - PyPI Index</h1>
+
+<p>Choose the appropriate index URL based on your GPU backend:</p>
+
+<h2>🔥 ROCm (AMD GPUs)</h2>
+<p>For AMD GPUs using ROCm:</p>
+<pre>pip install fastsafetensors --index-url https://embeddedllm.github.io/{repo_name}/rocm/simple/</pre>
+
+<h2>💚 CUDA (NVIDIA GPUs)</h2>
+<p>For NVIDIA GPUs using CUDA:</p>
+<pre>pip install fastsafetensors --index-url https://embeddedllm.github.io/{repo_name}/cuda/simple/</pre>
+
+<h2>Version Specific Installation</h2>
+<pre>pip install fastsafetensors==0.1.15 --index-url https://embeddedllm.github.io/{repo_name}/rocm/simple/</pre>
+
+<h2>In requirements.txt</h2>
+<pre>--index-url https://embeddedllm.github.io/{repo_name}/rocm/simple/
+fastsafetensors>=0.1.15</pre>
+
+<p>Direct access: <a href="rocm/simple/">ROCm Index</a> | <a href="cuda/simple/">CUDA Index</a></p>
+ + +""" + + output_path = base_dir / "index.html" + output_path.write_text(html) + print(f"Generated landing page: {output_path}") + +def main(): + # Configuration + repo_owner = os.environ.get("GITHUB_REPOSITORY_OWNER", "EmbeddedLLM") + repo_full = os.environ.get("GITHUB_REPOSITORY", "EmbeddedLLM/fastsafetensors-rocm") + repo_name = repo_full.split("/")[-1] + + print(f"Fetching releases from {repo_owner}/{repo_name}...") + releases = fetch_releases(repo_owner, repo_name) + print(f"Found {len(releases)} releases") + + # Extract wheels categorized by backend + wheels_by_backend = extract_wheels_by_backend(releases) + + total_wheels = sum(len(wheels) for wheels in wheels_by_backend.values()) + print(f"Found {total_wheels} total wheel files") + print(f" CUDA: {len(wheels_by_backend['cuda'])} wheels") + print(f" ROCm: {len(wheels_by_backend['rocm'])} wheels") + + if total_wheels == 0: + print("Warning: No wheel files found in any release", file=sys.stderr) + return + + # Generate indexes for each backend + for backend, wheels in wheels_by_backend.items(): + if not wheels: + print(f"Skipping {backend} index (no wheels found)") + continue + + print(f"\nGenerating {backend.upper()} index...") + output_dir = Path(f"pypi-index/{backend}/simple") + output_dir.mkdir(parents=True, exist_ok=True) + + # Group wheels by package name + packages = {} + for wheel in wheels: + # Extract package name from wheel filename (before first dash) + package_name = wheel["name"].split("-")[0] + if package_name not in packages: + packages[package_name] = [] + packages[package_name].append(wheel) + + # Generate indexes + generate_root_index(output_dir, packages.keys()) + + for package_name, package_wheels in packages.items(): + generate_package_index(output_dir, package_name, package_wheels) + + print(f" Generated {backend.upper()} index with {len(packages)} package(s)") + + # Generate landing page + base_dir = Path("pypi-index") + generate_landing_page(base_dir, repo_name) + + print(f"\n✓ Successfully generated indexes for all backends") + print(f" Total wheels: {total_wheels}") + +if __name__ == "__main__": + main() diff --git a/.github/workflows/deploy-pypi-index.yaml b/.github/workflows/deploy-pypi-index.yaml new file mode 100644 index 0000000..7eefa04 --- /dev/null +++ b/.github/workflows/deploy-pypi-index.yaml @@ -0,0 +1,53 @@ +name: Deploy PyPI Index to GitHub Pages + +on: + release: + types: [published] + workflow_dispatch: + +permissions: + contents: read + pages: write + id-token: write + +concurrency: + group: "pages" + cancel-in-progress: false + +jobs: + build: + runs-on: ubuntu-latest + steps: + - name: Checkout + uses: actions/checkout@v4 + + - name: Set up Python + uses: actions/setup-python@v5 + with: + python-version: '3.11' + + - name: Generate PyPI index from releases + env: + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} + run: | + chmod +x .github/scripts/generate_pypi_index.py + python .github/scripts/generate_pypi_index.py + + - name: Setup Pages + uses: actions/configure-pages@v4 + + - name: Upload artifact + uses: actions/upload-pages-artifact@v3 + with: + path: ./pypi-index + + deploy: + environment: + name: github-pages + url: ${{ steps.deployment.outputs.page_url }} + runs-on: ubuntu-latest + needs: build + steps: + - name: Deploy to GitHub Pages + id: deployment + uses: actions/deploy-pages@v4 diff --git a/.gitignore b/.gitignore index cbe6914..0660f62 100644 --- a/.gitignore +++ b/.gitignore @@ -15,4 +15,7 @@ examples/paddle_case/log # Auto-generated hipified files and directories (created 
during ROCm build) fastsafetensors/cpp/hip/ fastsafetensors/cpp/*.hip.* -fastsafetensors/cpp/hip_compat.h \ No newline at end of file +fastsafetensors/cpp/hip_compat.h + +# Auto-generated PyPI index (generated by GitHub Actions) +pypi-index/ \ No newline at end of file From f6101fc621d6e9f2e93fe45acf4dda90378d5e5c Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Thu, 6 Nov 2025 23:47:20 +0000 Subject: [PATCH 21/48] only manual trigger when deploying pypi index Signed-off-by: tjtanaa --- .github/workflows/deploy-pypi-index.yaml | 2 -- 1 file changed, 2 deletions(-) diff --git a/.github/workflows/deploy-pypi-index.yaml b/.github/workflows/deploy-pypi-index.yaml index 7eefa04..e56efb8 100644 --- a/.github/workflows/deploy-pypi-index.yaml +++ b/.github/workflows/deploy-pypi-index.yaml @@ -1,8 +1,6 @@ name: Deploy PyPI Index to GitHub Pages on: - release: - types: [published] workflow_dispatch: permissions: From 643d12d209ed4a04bdb7e3eecc6b20068cda2821 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 01:01:52 +0000 Subject: [PATCH 22/48] add publish to index GA workflow Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 198 ++++++++++++++++++++++++ 1 file changed, 198 insertions(+) create mode 100644 .github/workflows/publish-to-index.yaml diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml new file mode 100644 index 0000000..ebb5a29 --- /dev/null +++ b/.github/workflows/publish-to-index.yaml @@ -0,0 +1,198 @@ +name: Publish ROCm wheels to custom index + +on: + workflow_dispatch: + inputs: + version: + description: 'Version to publish (e.g., v0.1.15-rocm)' + required: true + release: + types: [published] + +permissions: + contents: read + +jobs: + publish-to-github-pages: + name: Publish to GitHub Pages index + runs-on: ubuntu-latest + + steps: + - name: Checkout fastsafetensors-rocm repo + uses: actions/checkout@v4 + with: + path: fastsafetensors-rocm + + - name: Set up Python + uses: actions/setup-python@v5 + with: + python-version: "3.12" + + - name: Install tools + run: | + python -m pip install --upgrade pip + pip install dumb-pypi + + - name: Download ROCm wheels from release + env: + GH_TOKEN: ${{ github.token }} + run: | + # Determine version + if [ "${{ github.event_name }}" = "release" ]; then + VERSION="${{ github.event.release.tag_name }}" + else + VERSION="${{ github.event.inputs.version }}" + fi + + echo "Downloading wheels for ${VERSION}" + + # Create directory for wheels + mkdir -p wheels/rocm + + # Download release assets (wheels) using gh CLI + cd wheels/rocm + gh release download "${VERSION}" \ + --repo EmbeddedLLM/fastsafetensors-rocm \ + --pattern "*.whl" + + ls -lah + + - name: Download all dependencies + run: | + # Create temporary directory for dependency resolution + mkdir -p deps_temp + + # For each Python version, download dependencies + for py_ver in 3.9 3.10 3.11 3.12 3.13; do + echo "Downloading dependencies for Python ${py_ver}" + + # Create a venv for this Python version to resolve dependencies + python${py_ver} -m venv deps_temp/venv${py_ver} 2>/dev/null || { + echo "Python ${py_ver} not available, skipping" + continue + } + + source deps_temp/venv${py_ver}/bin/activate + pip install --upgrade pip + + # Download dependencies for fastsafetensors (without fastsafetensors itself) + # This gets typer and all of typer's dependencies + pip download \ + --dest wheels/rocm \ + --only-binary :all: \ + --python-version ${py_ver} \ + --platform manylinux2014_x86_64 \ + --platform manylinux_2_17_x86_64 \ + 
--platform manylinux_2_27_x86_64 \ + --platform manylinux_2_28_x86_64 \ + typer || echo "Failed to download for Python ${py_ver}" + + deactivate + done + + # Also download using current Python for any missing wheels + pip download \ + --dest wheels/rocm \ + --only-binary :all: \ + typer + + # Remove duplicates and list what we have + cd wheels/rocm + # Remove duplicate wheels (keep latest version) + # This is a simple deduplication - you might want more sophisticated logic + ls -1 *.whl | sort | uniq + + echo "Total wheels collected:" + ls -1 *.whl | wc -l + + echo "Wheel breakdown by package:" + ls -1 *.whl | sed 's/-[0-9].*//' | sort | uniq -c + + - name: Checkout GitHub Pages repository + uses: actions/checkout@v4 + with: + repository: EmbeddedLLM/fastsafetensors-rocm + ref: gh-pages + token: ${{ secrets.GITHUB_TOKEN }} + path: gh-pages-repo + + - name: Copy wheels and generate index + run: | + cd gh-pages-repo + + # Create directory structure + mkdir -p rocm/packages + + # Copy all wheels + cp ../wheels/rocm/*.whl rocm/packages/ + + # Generate package list + ls rocm/packages/*.whl > rocm/package-list.txt + + # Generate PEP 503 compliant index + dumb-pypi \ + --package-list rocm/package-list.txt \ + --packages-url ../packages \ + --output-dir rocm/simple \ + --title "fastsafetensors ROCm Index" + + echo "Generated index for $(ls rocm/packages/*.whl | wc -l) wheels" + + - name: Create index README + run: | + cd gh-pages-repo + + cat > rocm/README.md << 'EOF' + # fastsafetensors ROCm Package Index + + This is a custom Python package index for ROCm-built fastsafetensors wheels. + + ## Installation + + ```bash + # Install fastsafetensors with ROCm support + pip install fastsafetensors --index-url https://embeddedllm.github.io/fastsafetensors-rocm/rocm/simple/ + ``` + + ## Available Packages + + This index includes: + - `fastsafetensors` - ROCm builds for Python 3.9-3.13 + - All dependencies (typer, click, etc.) for multiple Python versions and platforms + + ## What's Included + + EOF + + # List packages with counts + echo "### Package Inventory" >> rocm/README.md + echo "" >> rocm/README.md + ls rocm/packages/*.whl | sed 's/.*\///' | sed 's/-[0-9].*//' | sort | uniq -c | awk '{print "- " $2 ": " $1 " wheels"}' >> rocm/README.md + + - name: Commit and push to gh-pages + run: | + cd gh-pages-repo + + git config user.name "GitHub Actions" + git config user.email "actions@github.com" + + git add rocm/ + + if git diff --staged --quiet; then + echo "No changes to commit" + else + git commit -m "Update ROCm index - $(date +%Y-%m-%d)" + git push + echo "Successfully pushed to gh-pages branch" + fi + + - name: Summary + run: | + echo "## Published to GitHub Pages! 
🎉" >> $GITHUB_STEP_SUMMARY + echo "" >> $GITHUB_STEP_SUMMARY + echo "Index URL: https://embeddedllm.github.io/fastsafetensors-rocm/rocm/simple/" >> $GITHUB_STEP_SUMMARY + echo "" >> $GITHUB_STEP_SUMMARY + echo "### Installation" >> $GITHUB_STEP_SUMMARY + echo '```bash' >> $GITHUB_STEP_SUMMARY + echo "pip install fastsafetensors --index-url https://embeddedllm.github.io/fastsafetensors-rocm/rocm/simple/" >> $GITHUB_STEP_SUMMARY + echo '```' >> $GITHUB_STEP_SUMMARY From 0935d8c93688ae2f7f3a1712d66ec6736588fd61 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 01:18:29 +0000 Subject: [PATCH 23/48] fix the publish to index Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 307 ++++++++++++++++-------- 1 file changed, 212 insertions(+), 95 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index ebb5a29..610d62c 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -1,11 +1,20 @@ -name: Publish ROCm wheels to custom index +name: Publish wheels to custom index on: workflow_dispatch: inputs: version: - description: 'Version to publish (e.g., v0.1.15-rocm)' + description: 'Version to publish (e.g., v0.1.15-rocm or v0.1.15-cuda)' required: true + platform: + description: 'Platform to publish (rocm, cuda, or both)' + required: true + default: 'rocm' + type: choice + options: + - rocm + - cuda + - both release: types: [published] @@ -33,9 +42,8 @@ jobs: python -m pip install --upgrade pip pip install dumb-pypi - - name: Download ROCm wheels from release - env: - GH_TOKEN: ${{ github.token }} + - name: Determine platform and version + id: determine run: | # Determine version if [ "${{ github.event_name }}" = "release" ]; then @@ -43,70 +51,106 @@ jobs: else VERSION="${{ github.event.inputs.version }}" fi + echo "version=${VERSION}" >> $GITHUB_OUTPUT - echo "Downloading wheels for ${VERSION}" + # Determine platform from version tag or input + if [ "${{ github.event_name }}" = "release" ]; then + if [[ "${VERSION}" == *"rocm"* ]]; then + PLATFORM="rocm" + elif [[ "${VERSION}" == *"cuda"* ]]; then + PLATFORM="cuda" + else + PLATFORM="both" + fi + else + PLATFORM="${{ github.event.inputs.platform }}" + fi + echo "platform=${PLATFORM}" >> $GITHUB_OUTPUT - # Create directory for wheels - mkdir -p wheels/rocm + echo "Publishing version: ${VERSION}" + echo "Platform: ${PLATFORM}" - # Download release assets (wheels) using gh CLI - cd wheels/rocm - gh release download "${VERSION}" \ - --repo EmbeddedLLM/fastsafetensors-rocm \ - --pattern "*.whl" + - name: Download wheels from release + env: + GH_TOKEN: ${{ github.token }} + run: | + VERSION="${{ steps.determine.outputs.version }}" + PLATFORM="${{ steps.determine.outputs.platform }}" + + # Create directories + if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then + mkdir -p wheels/rocm + echo "Downloading ROCm wheels for ${VERSION}" + cd wheels/rocm + gh release download "${VERSION}" \ + --repo EmbeddedLLM/fastsafetensors-rocm \ + --pattern "*.whl" || echo "No ROCm wheels found" + ls -lah + cd ../.. + fi - ls -lah + if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then + mkdir -p wheels/cuda + echo "Downloading CUDA wheels for ${VERSION}" + cd wheels/cuda + gh release download "${VERSION}" \ + --repo EmbeddedLLM/fastsafetensors-rocm \ + --pattern "*.whl" || echo "No CUDA wheels found" + ls -lah + cd ../.. 
+ fi - name: Download all dependencies run: | - # Create temporary directory for dependency resolution - mkdir -p deps_temp - - # For each Python version, download dependencies - for py_ver in 3.9 3.10 3.11 3.12 3.13; do - echo "Downloading dependencies for Python ${py_ver}" - - # Create a venv for this Python version to resolve dependencies - python${py_ver} -m venv deps_temp/venv${py_ver} 2>/dev/null || { - echo "Python ${py_ver} not available, skipping" - continue - } - - source deps_temp/venv${py_ver}/bin/activate - pip install --upgrade pip - - # Download dependencies for fastsafetensors (without fastsafetensors itself) - # This gets typer and all of typer's dependencies - pip download \ - --dest wheels/rocm \ + PLATFORM="${{ steps.determine.outputs.platform }}" + + # Function to download dependencies for a platform + download_deps() { + local platform=$1 + local dest_dir="wheels/${platform}" + + echo "Downloading dependencies for ${platform}..." + + # For each Python version, download dependencies + for py_ver in 3.9 3.10 3.11 3.12 3.13; do + echo "Downloading dependencies for Python ${py_ver}" + + # Download dependencies using current Python (pip handles version compatibility) + python -m pip download \ + --dest "${dest_dir}" \ + --only-binary :all: \ + --python-version ${py_ver} \ + --platform manylinux2014_x86_64 \ + --platform manylinux_2_17_x86_64 \ + --platform manylinux_2_27_x86_64 \ + --platform manylinux_2_28_x86_64 \ + typer 2>/dev/null || echo "Some downloads failed for Python ${py_ver}" + done + + # Also download using current Python for any missing wheels + python -m pip download \ + --dest "${dest_dir}" \ --only-binary :all: \ - --python-version ${py_ver} \ - --platform manylinux2014_x86_64 \ - --platform manylinux_2_17_x86_64 \ - --platform manylinux_2_27_x86_64 \ - --platform manylinux_2_28_x86_64 \ - typer || echo "Failed to download for Python ${py_ver}" - - deactivate - done - - # Also download using current Python for any missing wheels - pip download \ - --dest wheels/rocm \ - --only-binary :all: \ - typer - - # Remove duplicates and list what we have - cd wheels/rocm - # Remove duplicate wheels (keep latest version) - # This is a simple deduplication - you might want more sophisticated logic - ls -1 *.whl | sort | uniq - - echo "Total wheels collected:" - ls -1 *.whl | wc -l - - echo "Wheel breakdown by package:" - ls -1 *.whl | sed 's/-[0-9].*//' | sort | uniq -c + typer || true + + # Summary + if [ -d "${dest_dir}" ] && [ "$(ls -A ${dest_dir}/*.whl 2>/dev/null)" ]; then + echo "Total wheels collected for ${platform}:" + ls -1 "${dest_dir}"/*.whl | wc -l + + echo "Wheel breakdown by package:" + ls -1 "${dest_dir}"/*.whl | xargs -n1 basename | sed 's/-[0-9].*//' | sort | uniq -c + fi + } + + # Download for requested platforms + if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then + download_deps "rocm" + fi + + if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then + download_deps "cuda" + fi - name: Checkout GitHub Pages repository uses: actions/checkout@v4 @@ -119,80 +163,153 @@ jobs: - name: Copy wheels and generate index run: | cd gh-pages-repo + PLATFORM="${{ steps.determine.outputs.platform }}" + + # Function to generate index for a platform + generate_index() { + local platform=$1 + + echo "Generating index for ${platform}..." 
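For reference, a rough Python rendering of the dependency download loop above; it is illustrative only and simply shells out to pip with the same flags the workflow uses:

    # Vendor 'typer' wheels for the interpreter/platform matrix used by the workflow.
    import subprocess
    import sys

    PY_VERSIONS = ["3.9", "3.10", "3.11", "3.12", "3.13"]
    PLATFORMS = [
        "manylinux2014_x86_64",
        "manylinux_2_17_x86_64",
        "manylinux_2_27_x86_64",
        "manylinux_2_28_x86_64",
    ]

    for py in PY_VERSIONS:
        cmd = [sys.executable, "-m", "pip", "download", "typer",
               "--dest", "wheels/rocm", "--only-binary", ":all:",
               "--python-version", py]
        for plat in PLATFORMS:
            cmd += ["--platform", plat]
        subprocess.run(cmd, check=False)  # tolerate per-version failures, as the workflow does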
- # Create directory structure - mkdir -p rocm/packages + # Create directory structure + mkdir -p "${platform}/packages" - # Copy all wheels - cp ../wheels/rocm/*.whl rocm/packages/ + # Copy all wheels + if [ -d "../wheels/${platform}" ] && [ "$(ls -A ../wheels/${platform}/*.whl 2>/dev/null)" ]; then + cp ../wheels/${platform}/*.whl "${platform}/packages/" - # Generate package list - ls rocm/packages/*.whl > rocm/package-list.txt + # Generate package list + ls "${platform}/packages"/*.whl > "${platform}/package-list.txt" - # Generate PEP 503 compliant index - dumb-pypi \ - --package-list rocm/package-list.txt \ - --packages-url ../packages \ - --output-dir rocm/simple \ - --title "fastsafetensors ROCm Index" + # Generate PEP 503 compliant index + dumb-pypi \ + --package-list "${platform}/package-list.txt" \ + --packages-url ../packages \ + --output-dir "${platform}/simple" \ + --title "fastsafetensors ${platform^^} Index" - echo "Generated index for $(ls rocm/packages/*.whl | wc -l) wheels" + echo "Generated ${platform} index for $(ls ${platform}/packages/*.whl | wc -l) wheels" + else + echo "No wheels found for ${platform}, skipping index generation" + fi + } - - name: Create index README + # Generate for requested platforms + if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then + generate_index "rocm" + fi + + if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then + generate_index "cuda" + fi + + - name: Create index READMEs run: | cd gh-pages-repo + PLATFORM="${{ steps.determine.outputs.platform }}" + + # Function to create README for a platform + create_readme() { + local platform=$1 + local platform_upper=$(echo $platform | tr '[:lower:]' '[:upper:]') - cat > rocm/README.md << 'EOF' - # fastsafetensors ROCm Package Index + if [ ! -d "${platform}/packages" ] || [ ! "$(ls -A ${platform}/packages/*.whl 2>/dev/null)" ]; then + echo "No packages for ${platform}, skipping README" + return + fi - This is a custom Python package index for ROCm-built fastsafetensors wheels. + cat > "${platform}/README.md" << EOF + # fastsafetensors ${platform_upper} Package Index + + This is a custom Python package index for ${platform_upper}-built fastsafetensors wheels. ## Installation - ```bash - # Install fastsafetensors with ROCm support - pip install fastsafetensors --index-url https://embeddedllm.github.io/fastsafetensors-rocm/rocm/simple/ - ``` + \`\`\`bash + # Install fastsafetensors with ${platform_upper} support + pip install fastsafetensors --index-url https://embeddedllm.github.io/fastsafetensors-rocm/${platform}/simple/ + \`\`\` ## Available Packages This index includes: - - `fastsafetensors` - ROCm builds for Python 3.9-3.13 + - \`fastsafetensors\` - ${platform_upper} builds for Python 3.9-3.13 - All dependencies (typer, click, etc.) 
for multiple Python versions and platforms ## What's Included EOF - # List packages with counts - echo "### Package Inventory" >> rocm/README.md - echo "" >> rocm/README.md - ls rocm/packages/*.whl | sed 's/.*\///' | sed 's/-[0-9].*//' | sort | uniq -c | awk '{print "- " $2 ": " $1 " wheels"}' >> rocm/README.md + # List packages with counts + echo "### Package Inventory" >> "${platform}/README.md" + echo "" >> "${platform}/README.md" + ls "${platform}/packages"/*.whl | sed 's/.*\///' | sed 's/-[0-9].*//' | sort | uniq -c | awk '{print "- " $2 ": " $1 " wheels"}' >> "${platform}/README.md" + } + + # Create READMEs for requested platforms + if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then + create_readme "rocm" + fi + + if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then + create_readme "cuda" + fi - name: Commit and push to gh-pages run: | cd gh-pages-repo + PLATFORM="${{ steps.determine.outputs.platform }}" git config user.name "GitHub Actions" git config user.email "actions@github.com" - git add rocm/ + # Add platform directories based on selection + if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then + git add rocm/ + fi + + if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then + git add cuda/ + fi if git diff --staged --quiet; then echo "No changes to commit" else - git commit -m "Update ROCm index - $(date +%Y-%m-%d)" + if [ "$PLATFORM" = "both" ]; then + git commit -m "Update ROCm and CUDA indices - $(date +%Y-%m-%d)" + elif [ "$PLATFORM" = "cuda" ]; then + git commit -m "Update CUDA index - $(date +%Y-%m-%d)" + else + git commit -m "Update ROCm index - $(date +%Y-%m-%d)" + fi git push echo "Successfully pushed to gh-pages branch" fi - name: Summary run: | + PLATFORM="${{ steps.determine.outputs.platform }}" + echo "## Published to GitHub Pages! 
🎉" >> $GITHUB_STEP_SUMMARY echo "" >> $GITHUB_STEP_SUMMARY - echo "Index URL: https://embeddedllm.github.io/fastsafetensors-rocm/rocm/simple/" >> $GITHUB_STEP_SUMMARY - echo "" >> $GITHUB_STEP_SUMMARY - echo "### Installation" >> $GITHUB_STEP_SUMMARY - echo '```bash' >> $GITHUB_STEP_SUMMARY - echo "pip install fastsafetensors --index-url https://embeddedllm.github.io/fastsafetensors-rocm/rocm/simple/" >> $GITHUB_STEP_SUMMARY - echo '```' >> $GITHUB_STEP_SUMMARY + + if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then + echo "### ROCm Index" >> $GITHUB_STEP_SUMMARY + echo "Index URL: https://embeddedllm.github.io/fastsafetensors-rocm/rocm/simple/" >> $GITHUB_STEP_SUMMARY + echo "" >> $GITHUB_STEP_SUMMARY + echo "**Installation:**" >> $GITHUB_STEP_SUMMARY + echo '```bash' >> $GITHUB_STEP_SUMMARY + echo "pip install fastsafetensors --index-url https://embeddedllm.github.io/fastsafetensors-rocm/rocm/simple/" >> $GITHUB_STEP_SUMMARY + echo '```' >> $GITHUB_STEP_SUMMARY + echo "" >> $GITHUB_STEP_SUMMARY + fi + + if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then + echo "### CUDA Index" >> $GITHUB_STEP_SUMMARY + echo "Index URL: https://embeddedllm.github.io/fastsafetensors-rocm/cuda/simple/" >> $GITHUB_STEP_SUMMARY + echo "" >> $GITHUB_STEP_SUMMARY + echo "**Installation:**" >> $GITHUB_STEP_SUMMARY + echo '```bash' >> $GITHUB_STEP_SUMMARY + echo "pip install fastsafetensors --index-url https://embeddedllm.github.io/fastsafetensors-rocm/cuda/simple/" >> $GITHUB_STEP_SUMMARY + echo '```' >> $GITHUB_STEP_SUMMARY + fi From 378b262284728b9babecbae37189c19f7d293818 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 01:21:08 +0000 Subject: [PATCH 24/48] fix the publish to index write permission Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index 610d62c..86fc93f 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -19,7 +19,7 @@ on: types: [published] permissions: - contents: read + contents: write jobs: publish-to-github-pages: From 5efe4a9e23e09b8faca9df9ca9466c3862c15405 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 01:30:37 +0000 Subject: [PATCH 25/48] fix the publish to index for both mode Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 31 +++++++++++++++++++------ 1 file changed, 24 insertions(+), 7 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index 86fc93f..b30c8b4 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -77,25 +77,42 @@ jobs: VERSION="${{ steps.determine.outputs.version }}" PLATFORM="${{ steps.determine.outputs.platform }}" - # Create directories + # Function to construct platform-specific version tag + get_version_tag() { + local platform=$1 + local version="${VERSION}" + + # If version already has platform suffix, use as-is + if [[ "${version}" == *"-${platform}"* ]]; then + echo "${version}" + else + # Otherwise append platform suffix + echo "${version}-${platform}" + fi + } + + # Download ROCm wheels if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then + ROCM_VERSION=$(get_version_tag "rocm") mkdir -p wheels/rocm - echo "Downloading ROCm wheels for ${VERSION}" + echo "Downloading ROCm wheels from release ${ROCM_VERSION}" cd wheels/rocm - gh release download "${VERSION}" \ + gh 
release download "${ROCM_VERSION}" \ --repo EmbeddedLLM/fastsafetensors-rocm \ - --pattern "*.whl" || echo "No ROCm wheels found" + --pattern "*.whl" || echo "Warning: No ROCm wheels found for ${ROCM_VERSION}" ls -lah cd ../.. fi + # Download CUDA wheels if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then + CUDA_VERSION=$(get_version_tag "cuda") mkdir -p wheels/cuda - echo "Downloading CUDA wheels for ${VERSION}" + echo "Downloading CUDA wheels from release ${CUDA_VERSION}" cd wheels/cuda - gh release download "${VERSION}" \ + gh release download "${CUDA_VERSION}" \ --repo EmbeddedLLM/fastsafetensors-rocm \ - --pattern "*.whl" || echo "No CUDA wheels found" + --pattern "*.whl" || echo "Warning: No CUDA wheels found for ${CUDA_VERSION}" ls -lah cd ../.. fi From 8871043c722a4583d651921338fdafa4ac3ab624 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 01:41:17 +0000 Subject: [PATCH 26/48] fix the manylinux rocmwheel build Signed-off-by: tjtanaa --- .github/workflows/build-rocm-wheels.yaml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml index 80e5ed4..142ee78 100644 --- a/.github/workflows/build-rocm-wheels.yaml +++ b/.github/workflows/build-rocm-wheels.yaml @@ -36,7 +36,8 @@ jobs: make \ git \ curl \ - ca-certificates + ca-certificates \ + patchelf - name: Install Python ${{ matrix.python-version }} run: | From 619c531d631c0a7edb2aa72c5045c1224cbe9da1 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 01:49:51 +0000 Subject: [PATCH 27/48] update publish to index Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 24 ++++++++++++++++++++---- 1 file changed, 20 insertions(+), 4 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index b30c8b4..142eb71 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -42,6 +42,14 @@ jobs: python -m pip install --upgrade pip pip install dumb-pypi + # Install GitHub CLI + type -p curl >/dev/null || (sudo apt update && sudo apt install curl -y) + curl -fsSL https://cli.github.com/packages/githubcli-archive-keyring.gpg | sudo dd of=/usr/share/keyrings/githubcli-archive-keyring.gpg \ + && sudo chmod go+r /usr/share/keyrings/githubcli-archive-keyring.gpg \ + && echo "deb [arch=$(dpkg --print-architecture) signed-by=/usr/share/keyrings/githubcli-archive-keyring.gpg] https://cli.github.com/packages stable main" | sudo tee /etc/apt/sources.list.d/github-cli.list > /dev/null \ + && sudo apt update \ + && sudo apt install gh -y + - name: Determine platform and version id: determine run: | @@ -97,9 +105,13 @@ jobs: mkdir -p wheels/rocm echo "Downloading ROCm wheels from release ${ROCM_VERSION}" cd wheels/rocm - gh release download "${ROCM_VERSION}" \ + if ! gh release download "${ROCM_VERSION}" \ --repo EmbeddedLLM/fastsafetensors-rocm \ - --pattern "*.whl" || echo "Warning: No ROCm wheels found for ${ROCM_VERSION}" + --pattern "*.whl"; then + echo "ERROR: Failed to download ROCm wheels from ${ROCM_VERSION}" + exit 1 + fi + echo "Downloaded wheels:" ls -lah cd ../.. fi @@ -110,9 +122,13 @@ jobs: mkdir -p wheels/cuda echo "Downloading CUDA wheels from release ${CUDA_VERSION}" cd wheels/cuda - gh release download "${CUDA_VERSION}" \ + if ! 
gh release download "${CUDA_VERSION}" \ --repo EmbeddedLLM/fastsafetensors-rocm \ - --pattern "*.whl" || echo "Warning: No CUDA wheels found for ${CUDA_VERSION}" + --pattern "*.whl"; then + echo "ERROR: Failed to download CUDA wheels from ${CUDA_VERSION}" + exit 1 + fi + echo "Downloaded wheels:" ls -lah cd ../.. fi From 6a3f302e50147e1fd3b564f995c9bcbd95ae5b26 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 01:58:27 +0000 Subject: [PATCH 28/48] fix nested dumb-pypi Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index 142eb71..01ffbaf 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -215,10 +215,11 @@ jobs: ls "${platform}/packages"/*.whl > "${platform}/package-list.txt" # Generate PEP 503 compliant index + # Note: dumb-pypi creates a /simple/ subdirectory inside output-dir dumb-pypi \ --package-list "${platform}/package-list.txt" \ --packages-url ../packages \ - --output-dir "${platform}/simple" \ + --output-dir "${platform}" \ --title "fastsafetensors ${platform^^} Index" echo "Generated ${platform} index for $(ls ${platform}/packages/*.whl | wc -l) wheels" From c3a580b31a47802ee60e0c98d0109b3c66ea8e0b Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 02:04:35 +0000 Subject: [PATCH 29/48] fix publish to index Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 19 +++++++++++++++++-- 1 file changed, 17 insertions(+), 2 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index 01ffbaf..973cf10 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -204,6 +204,12 @@ jobs: echo "Generating index for ${platform}..." 
+ # Clean up old index files to avoid conflicts + rm -rf "${platform}/simple" + rm -f "${platform}/package-list.txt" + rm -f "${platform}/index.html" + rm -f "${platform}/packages.json" + # Create directory structure mkdir -p "${platform}/packages" @@ -211,11 +217,15 @@ jobs: if [ -d "../wheels/${platform}" ] && [ "$(ls -A ../wheels/${platform}/*.whl 2>/dev/null)" ]; then cp ../wheels/${platform}/*.whl "${platform}/packages/" - # Generate package list - ls "${platform}/packages"/*.whl > "${platform}/package-list.txt" + # Generate package list with absolute paths + find "${platform}/packages" -name "*.whl" -type f > "${platform}/package-list.txt" + + echo "Package list contents:" + cat "${platform}/package-list.txt" # Generate PEP 503 compliant index # Note: dumb-pypi creates a /simple/ subdirectory inside output-dir + # packages-url is relative from simple/ to packages/: ../packages dumb-pypi \ --package-list "${platform}/package-list.txt" \ --packages-url ../packages \ @@ -223,6 +233,11 @@ jobs: --title "fastsafetensors ${platform^^} Index" echo "Generated ${platform} index for $(ls ${platform}/packages/*.whl | wc -l) wheels" + + # Debug: show generated structure + echo "Generated structure:" + ls -la "${platform}/simple/" || echo "No simple/ directory created" + ls -la "${platform}/simple/fastsafetensors/" || echo "No fastsafetensors/ directory created" else echo "No wheels found for ${platform}, skipping index generation" fi From 4eca2b7a8bc3330493204938a7c967d1a9bdb9cb Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 02:15:43 +0000 Subject: [PATCH 30/48] fix the dumb-pypi Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 18 ++++++++++-------- 1 file changed, 10 insertions(+), 8 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index 973cf10..f3f1c8f 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -217,20 +217,22 @@ jobs: if [ -d "../wheels/${platform}" ] && [ "$(ls -A ../wheels/${platform}/*.whl 2>/dev/null)" ]; then cp ../wheels/${platform}/*.whl "${platform}/packages/" - # Generate package list with absolute paths - find "${platform}/packages" -name "*.whl" -type f > "${platform}/package-list.txt" + # Generate package list with just filenames (dumb-pypi doesn't accept paths with /) + (cd "${platform}/packages" && ls *.whl) > "${platform}/package-list.txt" echo "Package list contents:" cat "${platform}/package-list.txt" # Generate PEP 503 compliant index - # Note: dumb-pypi creates a /simple/ subdirectory inside output-dir + # Note: dumb-pypi expects wheel files to be accessible from where it runs + # Run from packages/ directory so dumb-pypi can find the wheels by filename # packages-url is relative from simple/ to packages/: ../packages - dumb-pypi \ - --package-list "${platform}/package-list.txt" \ - --packages-url ../packages \ - --output-dir "${platform}" \ - --title "fastsafetensors ${platform^^} Index" + (cd "${platform}/packages" && \ + dumb-pypi \ + --package-list ../package-list.txt \ + --packages-url ../packages \ + --output-dir .. 
\ + --title "fastsafetensors ${platform^^} Index") echo "Generated ${platform} index for $(ls ${platform}/packages/*.whl | wc -l) wheels" From 2f158982d17fd70a855e35c17f3bc3b7d12355e2 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 02:22:27 +0000 Subject: [PATCH 31/48] fix the package path Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index f3f1c8f..e3650f3 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -226,11 +226,11 @@ jobs: # Generate PEP 503 compliant index # Note: dumb-pypi expects wheel files to be accessible from where it runs # Run from packages/ directory so dumb-pypi can find the wheels by filename - # packages-url is relative from simple/ to packages/: ../packages + # packages-url is relative from simple/fastsafetensors/ to packages/: ../../packages (cd "${platform}/packages" && \ dumb-pypi \ --package-list ../package-list.txt \ - --packages-url ../packages \ + --packages-url ../../packages \ --output-dir .. \ --title "fastsafetensors ${platform^^} Index") From 8ffcefa679ed68386667ad2479024195571df887 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 04:50:15 +0000 Subject: [PATCH 32/48] lint Signed-off-by: tjtanaa --- fastsafetensors/copier/gds.py | 2 +- fastsafetensors/frameworks/_paddle.py | 4 ++-- fastsafetensors/frameworks/_torch.py | 4 ++-- tests/test_fastsafetensors.py | 8 +++----- 4 files changed, 8 insertions(+), 10 deletions(-) diff --git a/fastsafetensors/copier/gds.py b/fastsafetensors/copier/gds.py index dc24f1f..c212d0d 100644 --- a/fastsafetensors/copier/gds.py +++ b/fastsafetensors/copier/gds.py @@ -28,7 +28,7 @@ def __init__( self.copy_reqs: Dict[int, int] = {} self.aligned_length = 0 cuda_ver = framework.get_cuda_ver() - if cuda_ver and cuda_ver != "none": + if cuda_ver and cuda_ver != "0.0": # Parse version string (e.g., "cuda-12.1" or "hip-5.7.0") # Extract the numeric part after the platform prefix ver_parts = cuda_ver.split("-", 1) diff --git a/fastsafetensors/frameworks/_paddle.py b/fastsafetensors/frameworks/_paddle.py index 7592d31..8ced6eb 100644 --- a/fastsafetensors/frameworks/_paddle.py +++ b/fastsafetensors/frameworks/_paddle.py @@ -217,7 +217,7 @@ def get_cuda_ver(self) -> str: """Get GPU runtime version with platform indicator. Returns a string like 'hip-5.7.0' for ROCm or 'cuda-12.1' for CUDA, - or 'none' if no GPU is available. This allows code to distinguish + or '0.0' if no GPU is available. This allows code to distinguish between different GPU platforms without using paddle directly. """ if paddle.device.is_compiled_with_cuda(): @@ -225,7 +225,7 @@ def get_cuda_ver(self) -> str: if paddle.device.is_compiled_with_rocm(): return f"hip-{paddle.version.cuda()}" return f"cuda-{paddle.version.cuda()}" - return "none" + return "0.0" def get_device_ptr_align(self) -> int: CUDA_PTR_ALIGN: int = 16 diff --git a/fastsafetensors/frameworks/_torch.py b/fastsafetensors/frameworks/_torch.py index affa214..aeb8084 100644 --- a/fastsafetensors/frameworks/_torch.py +++ b/fastsafetensors/frameworks/_torch.py @@ -189,7 +189,7 @@ def get_cuda_ver(self) -> str: """Get GPU runtime version with platform indicator. Returns a string like 'hip-5.7.0' for ROCm or 'cuda-12.1' for CUDA, - or 'none' if no GPU is available. This allows code to distinguish + or '0.0' if no GPU is available. 
This allows code to distinguish between different GPU platforms without using torch directly. """ if torch.cuda.is_available(): @@ -197,7 +197,7 @@ def get_cuda_ver(self) -> str: if hasattr(torch.version, "hip") and torch.version.hip is not None: return f"hip-{torch.version.hip}" return f"cuda-{torch.version.cuda}" - return "none" + return "0.0" def get_device_ptr_align(self) -> int: CUDA_PTR_ALIGN: int = 16 diff --git a/tests/test_fastsafetensors.py b/tests/test_fastsafetensors.py index 118e2ca..1f4ff28 100644 --- a/tests/test_fastsafetensors.py +++ b/tests/test_fastsafetensors.py @@ -113,11 +113,9 @@ def test_framework(fstcpp_log, framework) -> None: # Test that get_cuda_ver() returns a string with platform prefix cuda_ver = framework.get_cuda_ver() assert isinstance(cuda_ver, str) - # Should be "hip-X.Y.Z", "cuda-X.Y", or "none" + # Should be "hip-X.Y.Z", "cuda-X.Y", or "0.0" assert ( - cuda_ver.startswith("hip-") - or cuda_ver.startswith("cuda-") - or cuda_ver == "none" + cuda_ver.startswith("hip-") or cuda_ver.startswith("cuda-") or cuda_ver == "0.0" ) # Verify it matches what torch reports @@ -132,7 +130,7 @@ def test_framework(fstcpp_log, framework) -> None: assert cuda_ver.startswith("cuda-") assert str(torch.version.cuda) in cuda_ver else: - assert cuda_ver == "none" + assert cuda_ver == "0.0" def test_get_framework_fail(fstcpp_log) -> None: From f09cb5430440b12aafe452885379116b35debcb5 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 04:57:52 +0000 Subject: [PATCH 33/48] remove deploy-pypi-index Signed-off-by: tjtanaa --- .github/scripts/generate_pypi_index.py | 228 ----------------------- .github/workflows/deploy-pypi-index.yaml | 51 ----- 2 files changed, 279 deletions(-) delete mode 100755 .github/scripts/generate_pypi_index.py delete mode 100644 .github/workflows/deploy-pypi-index.yaml diff --git a/.github/scripts/generate_pypi_index.py b/.github/scripts/generate_pypi_index.py deleted file mode 100755 index eb360d9..0000000 --- a/.github/scripts/generate_pypi_index.py +++ /dev/null @@ -1,228 +0,0 @@ -#!/usr/bin/env python3 -""" -Generate PyPI-compatible simple index from GitHub releases. -This script fetches all releases and creates separate indexes for CUDA and ROCm wheels. 
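The prefixed strings returned by `get_cuda_ver()` ("cuda-12.1", "hip-5.7.0", or "0.0" when no GPU runtime is present) are straightforward to split apart on the consumer side. A minimal sketch of such a parser, independent of torch or paddle; the helper name and the returned tuple shape are illustrative, not part of the patch:

```python
# Sketch of a consumer-side parser for the prefixed GPU version strings.
from typing import Optional, Tuple

def parse_gpu_ver(ver: str) -> Tuple[Optional[str], Tuple[int, ...]]:
    """Return (platform, numeric_version); platform is None for '0.0'."""
    if not ver or ver == "0.0":
        return None, ()
    platform, _, numbers = ver.partition("-")
    parts = []
    for piece in numbers.split("."):
        digits = "".join(ch for ch in piece if ch.isdigit())
        parts.append(int(digits) if digits else 0)
    return platform, tuple(parts)

assert parse_gpu_ver("cuda-12.1") == ("cuda", (12, 1))
assert parse_gpu_ver("hip-5.7.0") == ("hip", (5, 7, 0))
assert parse_gpu_ver("0.0") == (None, ())
```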
-""" - -import json -import os -import sys -from pathlib import Path -from urllib.request import urlopen, Request - -def fetch_releases(repo_owner, repo_name): - """Fetch all releases from GitHub API.""" - url = f"https://api.github.com/repos/{repo_owner}/{repo_name}/releases" - headers = { - "Accept": "application/vnd.github.v3+json", - "User-Agent": "PyPI-Index-Generator" - } - - # Add GitHub token if available (for higher rate limits) - token = os.environ.get("GITHUB_TOKEN") - if token: - headers["Authorization"] = f"token {token}" - - request = Request(url, headers=headers) - - try: - with urlopen(request) as response: - return json.loads(response.read().decode()) - except Exception as e: - print(f"Error fetching releases: {e}", file=sys.stderr) - sys.exit(1) - -def categorize_backend(release_tag): - """Determine backend (cuda/rocm) from release tag.""" - tag_lower = release_tag.lower() - - if "rocm" in tag_lower: - return "rocm" - elif "cuda" in tag_lower: - return "cuda" - else: - # Default to cuda for untagged releases - return "cuda" - -def extract_wheels_by_backend(releases): - """Extract wheel files from releases, categorized by backend.""" - wheels_by_backend = { - "cuda": [], - "rocm": [] - } - - for release in releases: - backend = categorize_backend(release.get("tag_name", "")) - - for asset in release.get("assets", []): - name = asset.get("name", "") - if name.endswith(".whl"): - wheels_by_backend[backend].append({ - "name": name, - "url": asset.get("browser_download_url"), - "version": release.get("tag_name"), - }) - - return wheels_by_backend - -def generate_root_index(output_dir, packages): - """Generate the root simple index.""" - html = """ - - - - Simple Index - - -

Simple Index

-""" - - for package in sorted(packages): - html += f' {package}
\n' - - html += """ - -""" - - output_path = output_dir / "index.html" - output_path.write_text(html) - print(f"Generated: {output_path}") - -def generate_package_index(output_dir, package_name, wheels): - """Generate package-specific index with all wheels.""" - html = f""" - - - - Links for {package_name} - - -

Links for {package_name}

-""" - - # Sort wheels by version and Python version - sorted_wheels = sorted(wheels, key=lambda w: (w["name"], w["version"]), reverse=True) - - for wheel in sorted_wheels: - # Extract package name from wheel filename to ensure consistency - wheel_name = wheel["name"] - url = wheel["url"] - html += f' {wheel_name}
\n' - - html += """ - -""" - - package_dir = output_dir / package_name - package_dir.mkdir(parents=True, exist_ok=True) - - output_path = package_dir / "index.html" - output_path.write_text(html) - print(f"Generated: {output_path}") - -def generate_landing_page(base_dir, repo_name): - """Generate a landing page for the PyPI index.""" - html = f""" - - - - {repo_name} - PyPI Index - - - -

{repo_name} - PyPI Index

-

Choose the appropriate index URL based on your GPU backend:

- -
-

🔥 ROCm (AMD GPUs)

-

For AMD GPUs using ROCm:

-
pip install fastsafetensors --index-url https://embeddedllm.github.io/{repo_name}/rocm/simple/
-
- -
-

💚 CUDA (NVIDIA GPUs)

-

For NVIDIA GPUs using CUDA:

-
pip install fastsafetensors --index-url https://embeddedllm.github.io/{repo_name}/cuda/simple/
-
- -

Version Specific Installation

-
pip install fastsafetensors==0.1.15 --index-url https://embeddedllm.github.io/{repo_name}/rocm/simple/
- -

In requirements.txt

-
--index-url https://embeddedllm.github.io/{repo_name}/rocm/simple/
-fastsafetensors>=0.1.15
- -
-

Direct access: ROCm Index | CUDA Index

- - -""" - - output_path = base_dir / "index.html" - output_path.write_text(html) - print(f"Generated landing page: {output_path}") - -def main(): - # Configuration - repo_owner = os.environ.get("GITHUB_REPOSITORY_OWNER", "EmbeddedLLM") - repo_full = os.environ.get("GITHUB_REPOSITORY", "EmbeddedLLM/fastsafetensors-rocm") - repo_name = repo_full.split("/")[-1] - - print(f"Fetching releases from {repo_owner}/{repo_name}...") - releases = fetch_releases(repo_owner, repo_name) - print(f"Found {len(releases)} releases") - - # Extract wheels categorized by backend - wheels_by_backend = extract_wheels_by_backend(releases) - - total_wheels = sum(len(wheels) for wheels in wheels_by_backend.values()) - print(f"Found {total_wheels} total wheel files") - print(f" CUDA: {len(wheels_by_backend['cuda'])} wheels") - print(f" ROCm: {len(wheels_by_backend['rocm'])} wheels") - - if total_wheels == 0: - print("Warning: No wheel files found in any release", file=sys.stderr) - return - - # Generate indexes for each backend - for backend, wheels in wheels_by_backend.items(): - if not wheels: - print(f"Skipping {backend} index (no wheels found)") - continue - - print(f"\nGenerating {backend.upper()} index...") - output_dir = Path(f"pypi-index/{backend}/simple") - output_dir.mkdir(parents=True, exist_ok=True) - - # Group wheels by package name - packages = {} - for wheel in wheels: - # Extract package name from wheel filename (before first dash) - package_name = wheel["name"].split("-")[0] - if package_name not in packages: - packages[package_name] = [] - packages[package_name].append(wheel) - - # Generate indexes - generate_root_index(output_dir, packages.keys()) - - for package_name, package_wheels in packages.items(): - generate_package_index(output_dir, package_name, package_wheels) - - print(f" Generated {backend.upper()} index with {len(packages)} package(s)") - - # Generate landing page - base_dir = Path("pypi-index") - generate_landing_page(base_dir, repo_name) - - print(f"\n✓ Successfully generated indexes for all backends") - print(f" Total wheels: {total_wheels}") - -if __name__ == "__main__": - main() diff --git a/.github/workflows/deploy-pypi-index.yaml b/.github/workflows/deploy-pypi-index.yaml deleted file mode 100644 index e56efb8..0000000 --- a/.github/workflows/deploy-pypi-index.yaml +++ /dev/null @@ -1,51 +0,0 @@ -name: Deploy PyPI Index to GitHub Pages - -on: - workflow_dispatch: - -permissions: - contents: read - pages: write - id-token: write - -concurrency: - group: "pages" - cancel-in-progress: false - -jobs: - build: - runs-on: ubuntu-latest - steps: - - name: Checkout - uses: actions/checkout@v4 - - - name: Set up Python - uses: actions/setup-python@v5 - with: - python-version: '3.11' - - - name: Generate PyPI index from releases - env: - GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} - run: | - chmod +x .github/scripts/generate_pypi_index.py - python .github/scripts/generate_pypi_index.py - - - name: Setup Pages - uses: actions/configure-pages@v4 - - - name: Upload artifact - uses: actions/upload-pages-artifact@v3 - with: - path: ./pypi-index - - deploy: - environment: - name: github-pages - url: ${{ steps.deployment.outputs.page_url }} - runs-on: ubuntu-latest - needs: build - steps: - - name: Deploy to GitHub Pages - id: deployment - uses: actions/deploy-pages@v4 From 821fb41ad72840428dcf91b6c11baa0abeeb8760 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 05:08:45 +0000 Subject: [PATCH 34/48] remove unused code Signed-off-by: tjtanaa --- tests/platform_utils.py | 22 
---------------------- 1 file changed, 22 deletions(-) diff --git a/tests/platform_utils.py b/tests/platform_utils.py index e0b4498..d9da5f6 100644 --- a/tests/platform_utils.py +++ b/tests/platform_utils.py @@ -29,18 +29,6 @@ def is_cuda_platform(): "test_GdsFileCopier", # GDS not available on AMD } -# List of tests with memory leak detection issues on ROCm (non-critical) -ROCM_MEMORY_LEAK_TESTS = { - "test_SafeTensorsFileLoader", - "test_SafeTensorsFileLoaderNoGds", - "test_fastsafe_open", - "test_int8", - "test_float8_e5m2", - "test_float8_e4m3fn", - "test_float8_e4m3fn_to_int8", - "test_cpp_metrics", -} - def skip_if_rocm_expected_failure(test_name): """Skip test if it's an expected failure on ROCm.""" @@ -50,16 +38,6 @@ def skip_if_rocm_expected_failure(test_name): ) -def xfail_if_rocm_memory_leak(test_name): - """Mark test as expected to fail on ROCm due to memory leak detection issues.""" - if is_rocm_platform() and test_name in ROCM_MEMORY_LEAK_TESTS: - return pytest.mark.xfail( - reason=f"Test '{test_name}' has memory leak detection issues on ROCm (non-critical)", - strict=False, - ) - return lambda func: func - - def get_platform_info(): """Get platform information for debugging. From e9ff27f67372494d1f760908d4b3310618bbc8f5 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 05:37:50 +0000 Subject: [PATCH 35/48] update publish to index to handle version isolation Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 155 +++++++++++++++++++++++- 1 file changed, 152 insertions(+), 3 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index e3650f3..8609d9c 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -133,6 +133,93 @@ jobs: cd ../.. 
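A short sketch of how a test might consume the helpers kept in tests/platform_utils.py. Only the helper names come from the patch; the test bodies are illustrative, the import assumes the file is importable from the test's own directory, and it assumes `skip_if_rocm_expected_failure` calls `pytest.skip` internally, as its docstring suggests.

```python
# Illustrative usage of the tests/platform_utils.py helpers (names from the patch,
# test bodies invented for the example).
import pytest

from platform_utils import (
    get_platform_info,
    is_rocm_platform,
    skip_if_rocm_expected_failure,
)

def test_gds_copier_smoke():
    # Skips on ROCm because GDS-based tests are listed in ROCM_EXPECTED_FAILURES.
    skip_if_rocm_expected_failure("test_GdsFileCopier")
    ...  # GDS-specific assertions would go here

@pytest.mark.skipif(is_rocm_platform(), reason="CUDA-only code path")
def test_cuda_only_path():
    print(get_platform_info())  # handy when reading CI logs
```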
fi + - name: Extract dependencies from wheels + run: | + PLATFORM="${{ steps.determine.outputs.platform }}" + VERSION="${{ steps.determine.outputs.version }}" + + # Python script to extract dependencies from wheel metadata + cat > extract_deps.py << 'PYTHON_SCRIPT' +import sys +import zipfile +import re +from pathlib import Path + +def extract_dependencies(wheel_path): + """Extract Requires-Dist from wheel METADATA.""" + dependencies = [] + + try: + with zipfile.ZipFile(wheel_path, 'r') as whl: + # Find METADATA file (usually in *.dist-info/METADATA) + metadata_files = [f for f in whl.namelist() if f.endswith('.dist-info/METADATA')] + + if not metadata_files: + print(f"Warning: No METADATA found in {wheel_path}", file=sys.stderr) + return dependencies + + metadata_content = whl.read(metadata_files[0]).decode('utf-8') + + # Parse Requires-Dist lines + for line in metadata_content.split('\n'): + line = line.strip() + if line.startswith('Requires-Dist:'): + # Extract dependency specification + dep = line.split(':', 1)[1].strip() + # Remove extras and environment markers + dep = re.split(r'\s*;\s*', dep)[0] + dep = re.split(r'\s*\[', dep)[0] + dependencies.append(dep) + + except Exception as e: + print(f"Error reading {wheel_path}: {e}", file=sys.stderr) + + return dependencies + +if __name__ == "__main__": + wheel_dir = sys.argv[1] + wheel_files = list(Path(wheel_dir).glob("fastsafetensors-*.whl")) + + if not wheel_files: + print("Error: No fastsafetensors wheels found", file=sys.stderr) + sys.exit(1) + + # Use first wheel (all should have same dependencies) + wheel_path = wheel_files[0] + print(f"Extracting dependencies from: {wheel_path.name}", file=sys.stderr) + + deps = extract_dependencies(wheel_path) + + # Output dependencies one per line + for dep in deps: + print(dep) +PYTHON_SCRIPT + + # Extract dependencies for each platform + extract_deps_for_platform() { + local platform=$1 + local wheel_dir="wheels/${platform}" + + if [ ! -d "${wheel_dir}" ]; then + echo "No wheels directory for ${platform}" + return + fi + + echo "Extracting dependencies from ${platform} wheels..." + python extract_deps.py "${wheel_dir}" > "${wheel_dir}/requirements.txt" 2>&1 + + echo "Extracted dependencies:" + cat "${wheel_dir}/requirements.txt" + } + + if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then + extract_deps_for_platform "rocm" + fi + + if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then + extract_deps_for_platform "cuda" + fi + - name: Download all dependencies run: | PLATFORM="${{ steps.determine.outputs.platform }}" @@ -141,14 +228,20 @@ jobs: download_deps() { local platform=$1 local dest_dir="wheels/${platform}" + local req_file="${dest_dir}/requirements.txt" echo "Downloading dependencies for ${platform}..." + if [ ! 
-f "${req_file}" ]; then + echo "No requirements file found for ${platform}, skipping" + return + fi + # For each Python version, download dependencies for py_ver in 3.9 3.10 3.11 3.12 3.13; do echo "Downloading dependencies for Python ${py_ver}" - # Download dependencies using current Python (pip handles version compatibility) + # Download dependencies using extracted requirements python -m pip download \ --dest "${dest_dir}" \ --only-binary :all: \ @@ -157,14 +250,14 @@ jobs: --platform manylinux_2_17_x86_64 \ --platform manylinux_2_27_x86_64 \ --platform manylinux_2_28_x86_64 \ - typer 2>/dev/null || echo "Some downloads failed for Python ${py_ver}" + -r "${req_file}" 2>/dev/null || echo "Some downloads failed for Python ${py_ver}" done # Also download using current Python for any missing wheels python -m pip download \ --dest "${dest_dir}" \ --only-binary :all: \ - typer || true + -r "${req_file}" || true # Summary if [ -d "${dest_dir}" ] && [ "$(ls -A ${dest_dir}/*.whl 2>/dev/null)" ]; then @@ -197,10 +290,12 @@ jobs: run: | cd gh-pages-repo PLATFORM="${{ steps.determine.outputs.platform }}" + VERSION="${{ steps.determine.outputs.version }}" # Function to generate index for a platform generate_index() { local platform=$1 + local version="${VERSION}" echo "Generating index for ${platform}..." @@ -212,9 +307,19 @@ jobs: # Create directory structure mkdir -p "${platform}/packages" + mkdir -p "${platform}/manifests" # Copy all wheels if [ -d "../wheels/${platform}" ] && [ "$(ls -A ../wheels/${platform}/*.whl 2>/dev/null)" ]; then + # Extract version number (remove 'v' prefix if present) + local clean_version="${version#v}" + + # Remove OLD wheels for the SAME version only + echo "Removing old fastsafetensors-${clean_version} wheels..." + rm -f "${platform}/packages/fastsafetensors-${clean_version}"-*.whl || true + + # Copy new wheels + echo "Copying new wheels..." cp ../wheels/${platform}/*.whl "${platform}/packages/" # Generate package list with just filenames (dumb-pypi doesn't accept paths with /) @@ -223,6 +328,50 @@ jobs: echo "Package list contents:" cat "${platform}/package-list.txt" + # Create manifest for this version + echo "Creating manifest for version ${clean_version}..." 
+ local manifest_file="${platform}/manifests/v${clean_version}.json" + + # Read dependencies from requirements.txt + local deps_json="[]" + if [ -f "../wheels/${platform}/requirements.txt" ]; then + deps_json=$(python3 -c " +import json +with open('../wheels/${platform}/requirements.txt') as f: + deps = [line.strip() for line in f if line.strip() and not line.startswith('#')] +print(json.dumps(deps)) +") + fi + + # List fastsafetensors wheels + local fst_wheels_json=$(cd "${platform}/packages" && python3 -c " +import json, glob +wheels = sorted([f for f in glob.glob('fastsafetensors-${clean_version}-*.whl')]) +print(json.dumps(wheels)) +") + + # List all downloaded wheels + local all_wheels_json=$(cd "${platform}/packages" && python3 -c " +import json, glob +wheels = sorted(glob.glob('*.whl')) +print(json.dumps(wheels)) +") + + # Create manifest JSON + cat > "${manifest_file}" << EOF +{ + "fastsafetensors_version": "${clean_version}", + "published_at": "$(date -u +%Y-%m-%dT%H:%M:%SZ)", + "platform": "${platform}", + "dependencies": ${deps_json}, + "fastsafetensors_wheels": ${fst_wheels_json}, + "total_wheels_in_index": $(echo ${all_wheels_json} | python3 -c "import json, sys; print(len(json.load(sys.stdin)))") +} +EOF + + echo "Created manifest:" + cat "${manifest_file}" + # Generate PEP 503 compliant index # Note: dumb-pypi expects wheel files to be accessible from where it runs # Run from packages/ directory so dumb-pypi can find the wheels by filename From eff48c76096ade2e8c3131ef0387ed74c614e49e Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 05:41:56 +0000 Subject: [PATCH 36/48] fix publish to index yaml syntax Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 77 ++++++++++++------------- 1 file changed, 37 insertions(+), 40 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index 8609d9c..ad031be 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -138,37 +138,46 @@ jobs: PLATFORM="${{ steps.determine.outputs.platform }}" VERSION="${{ steps.determine.outputs.version }}" - # Python script to extract dependencies from wheel metadata - cat > extract_deps.py << 'PYTHON_SCRIPT' + # Extract dependencies for each platform + extract_deps_for_platform() { + local platform=$1 + export WHEEL_DIR="wheels/${platform}" + export OUTPUT_FILE="wheels/${platform}/requirements.txt" + + if [ ! -d "${WHEEL_DIR}" ]; then + echo "No wheels directory for ${platform}" + return + fi + + echo "Extracting dependencies from ${platform} wheels..." 
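The per-version manifest written under `${platform}/manifests/` can be assembled just as well with plain stdlib JSON instead of inline `python3 -c` one-liners. The field names below follow the workflow step; the platform, version, and paths are example values for the sketch:

```python
# Sketch of building the v<version>.json manifest with the same fields as the workflow.
import glob
import json
from datetime import datetime, timezone

platform = "rocm"          # example values
clean_version = "0.1.15"

with open(f"wheels/{platform}/requirements.txt") as f:
    dependencies = [ln.strip() for ln in f if ln.strip() and not ln.startswith("#")]

fst_wheels = sorted(glob.glob(f"{platform}/packages/fastsafetensors-{clean_version}-*.whl"))
all_wheels = sorted(glob.glob(f"{platform}/packages/*.whl"))

manifest = {
    "fastsafetensors_version": clean_version,
    "published_at": datetime.now(timezone.utc).strftime("%Y-%m-%dT%H:%M:%SZ"),
    "platform": platform,
    "dependencies": dependencies,
    "fastsafetensors_wheels": [p.rsplit("/", 1)[-1] for p in fst_wheels],
    "total_wheels_in_index": len(all_wheels),
}

with open(f"{platform}/manifests/v{clean_version}.json", "w") as f:
    json.dump(manifest, f, indent=2)
```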
+ + python3 -c ' import sys import zipfile import re from pathlib import Path +import os def extract_dependencies(wheel_path): """Extract Requires-Dist from wheel METADATA.""" dependencies = [] try: - with zipfile.ZipFile(wheel_path, 'r') as whl: - # Find METADATA file (usually in *.dist-info/METADATA) - metadata_files = [f for f in whl.namelist() if f.endswith('.dist-info/METADATA')] + with zipfile.ZipFile(wheel_path, "r") as whl: + metadata_files = [f for f in whl.namelist() if f.endswith(".dist-info/METADATA")] if not metadata_files: print(f"Warning: No METADATA found in {wheel_path}", file=sys.stderr) return dependencies - metadata_content = whl.read(metadata_files[0]).decode('utf-8') + metadata_content = whl.read(metadata_files[0]).decode("utf-8") - # Parse Requires-Dist lines - for line in metadata_content.split('\n'): + for line in metadata_content.split("\n"): line = line.strip() - if line.startswith('Requires-Dist:'): - # Extract dependency specification - dep = line.split(':', 1)[1].strip() - # Remove extras and environment markers - dep = re.split(r'\s*;\s*', dep)[0] - dep = re.split(r'\s*\[', dep)[0] + if line.startswith("Requires-Dist:"): + dep = line.split(":", 1)[1].strip() + dep = re.split(r"\s*;\s*", dep)[0] + dep = re.split(r"\s*\[", dep)[0] dependencies.append(dep) except Exception as e: @@ -176,40 +185,28 @@ def extract_dependencies(wheel_path): return dependencies -if __name__ == "__main__": - wheel_dir = sys.argv[1] - wheel_files = list(Path(wheel_dir).glob("fastsafetensors-*.whl")) +wheel_dir = os.environ["WHEEL_DIR"] +output_file = os.environ["OUTPUT_FILE"] +wheel_files = list(Path(wheel_dir).glob("fastsafetensors-*.whl")) - if not wheel_files: - print("Error: No fastsafetensors wheels found", file=sys.stderr) - sys.exit(1) +if not wheel_files: + print("Error: No fastsafetensors wheels found", file=sys.stderr) + sys.exit(1) - # Use first wheel (all should have same dependencies) - wheel_path = wheel_files[0] - print(f"Extracting dependencies from: {wheel_path.name}", file=sys.stderr) +wheel_path = wheel_files[0] +print(f"Extracting dependencies from: {wheel_path.name}", file=sys.stderr) - deps = extract_dependencies(wheel_path) +deps = extract_dependencies(wheel_path) - # Output dependencies one per line +with open(output_file, "w") as f: for dep in deps: - print(dep) -PYTHON_SCRIPT + f.write(dep + "\n") - # Extract dependencies for each platform - extract_deps_for_platform() { - local platform=$1 - local wheel_dir="wheels/${platform}" - - if [ ! -d "${wheel_dir}" ]; then - echo "No wheels directory for ${platform}" - return - fi - - echo "Extracting dependencies from ${platform} wheels..." 
- python extract_deps.py "${wheel_dir}" > "${wheel_dir}/requirements.txt" 2>&1 +print(f"Wrote {len(deps)} dependencies to {output_file}", file=sys.stderr) +' echo "Extracted dependencies:" - cat "${wheel_dir}/requirements.txt" + cat "${OUTPUT_FILE}" } if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then From 4dcbb76d9a86f8b2ef95a1d4f2516d8dd03150a3 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 05:48:05 +0000 Subject: [PATCH 37/48] fix publish to index syntax error Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 98 +++---------------------- 1 file changed, 11 insertions(+), 87 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index ad031be..89192f0 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -138,75 +138,21 @@ jobs: PLATFORM="${{ steps.determine.outputs.platform }}" VERSION="${{ steps.determine.outputs.version }}" - # Extract dependencies for each platform extract_deps_for_platform() { local platform=$1 - export WHEEL_DIR="wheels/${platform}" - export OUTPUT_FILE="wheels/${platform}/requirements.txt" + local wheel_dir="wheels/${platform}" + local output_file="wheels/${platform}/requirements.txt" - if [ ! -d "${WHEEL_DIR}" ]; then + if [ ! -d "${wheel_dir}" ]; then echo "No wheels directory for ${platform}" return fi echo "Extracting dependencies from ${platform} wheels..." - - python3 -c ' -import sys -import zipfile -import re -from pathlib import Path -import os - -def extract_dependencies(wheel_path): - """Extract Requires-Dist from wheel METADATA.""" - dependencies = [] - - try: - with zipfile.ZipFile(wheel_path, "r") as whl: - metadata_files = [f for f in whl.namelist() if f.endswith(".dist-info/METADATA")] - - if not metadata_files: - print(f"Warning: No METADATA found in {wheel_path}", file=sys.stderr) - return dependencies - - metadata_content = whl.read(metadata_files[0]).decode("utf-8") - - for line in metadata_content.split("\n"): - line = line.strip() - if line.startswith("Requires-Dist:"): - dep = line.split(":", 1)[1].strip() - dep = re.split(r"\s*;\s*", dep)[0] - dep = re.split(r"\s*\[", dep)[0] - dependencies.append(dep) - - except Exception as e: - print(f"Error reading {wheel_path}: {e}", file=sys.stderr) - - return dependencies - -wheel_dir = os.environ["WHEEL_DIR"] -output_file = os.environ["OUTPUT_FILE"] -wheel_files = list(Path(wheel_dir).glob("fastsafetensors-*.whl")) - -if not wheel_files: - print("Error: No fastsafetensors wheels found", file=sys.stderr) - sys.exit(1) - -wheel_path = wheel_files[0] -print(f"Extracting dependencies from: {wheel_path.name}", file=sys.stderr) - -deps = extract_dependencies(wheel_path) - -with open(output_file, "w") as f: - for dep in deps: - f.write(dep + "\n") - -print(f"Wrote {len(deps)} dependencies to {output_file}", file=sys.stderr) -' + python3 fastsafetensors-rocm/.github/scripts/extract_wheel_deps.py "${wheel_dir}" "${output_file}" echo "Extracted dependencies:" - cat "${OUTPUT_FILE}" + cat "${output_file}" } if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then @@ -332,39 +278,17 @@ print(f"Wrote {len(deps)} dependencies to {output_file}", file=sys.stderr) # Read dependencies from requirements.txt local deps_json="[]" if [ -f "../wheels/${platform}/requirements.txt" ]; then - deps_json=$(python3 -c " -import json -with open('../wheels/${platform}/requirements.txt') as f: - deps = [line.strip() for line in f if line.strip() and not line.startswith('#')] 
-print(json.dumps(deps)) -") + deps_json=$(python3 -c 'import json,sys; print(json.dumps([line.strip() for line in open("../wheels/'${platform}'/requirements.txt") if line.strip() and not line.startswith("#")]))') fi # List fastsafetensors wheels - local fst_wheels_json=$(cd "${platform}/packages" && python3 -c " -import json, glob -wheels = sorted([f for f in glob.glob('fastsafetensors-${clean_version}-*.whl')]) -print(json.dumps(wheels)) -") + local fst_wheels_json=$(cd "${platform}/packages" && python3 -c 'import json,glob; print(json.dumps(sorted(glob.glob("fastsafetensors-'${clean_version}'-*.whl"))))') # List all downloaded wheels - local all_wheels_json=$(cd "${platform}/packages" && python3 -c " -import json, glob -wheels = sorted(glob.glob('*.whl')) -print(json.dumps(wheels)) -") - - # Create manifest JSON - cat > "${manifest_file}" << EOF -{ - "fastsafetensors_version": "${clean_version}", - "published_at": "$(date -u +%Y-%m-%dT%H:%M:%SZ)", - "platform": "${platform}", - "dependencies": ${deps_json}, - "fastsafetensors_wheels": ${fst_wheels_json}, - "total_wheels_in_index": $(echo ${all_wheels_json} | python3 -c "import json, sys; print(len(json.load(sys.stdin)))") -} -EOF + local all_wheels_json=$(cd "${platform}/packages" && python3 -c 'import json,glob; print(json.dumps(sorted(glob.glob("*.whl"))))') + + # Create manifest JSON using Python + python3 -c "import json,sys; manifest={'fastsafetensors_version':'${clean_version}','published_at':'$(date -u +%Y-%m-%dT%H:%M:%SZ)','platform':'${platform}','dependencies':${deps_json},'fastsafetensors_wheels':${fst_wheels_json},'total_wheels_in_index':len(${all_wheels_json})}; json.dump(manifest,open('${manifest_file}','w'),indent=2)" echo "Created manifest:" cat "${manifest_file}" From 86faab47d73103fc5ad20bd276154551feaf53df Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 05:48:32 +0000 Subject: [PATCH 38/48] add workflow python script Signed-off-by: tjtanaa --- .github/scripts/extract_wheel_deps.py | 75 +++++++++++++++++++++++++++ 1 file changed, 75 insertions(+) create mode 100644 .github/scripts/extract_wheel_deps.py diff --git a/.github/scripts/extract_wheel_deps.py b/.github/scripts/extract_wheel_deps.py new file mode 100644 index 0000000..79eff27 --- /dev/null +++ b/.github/scripts/extract_wheel_deps.py @@ -0,0 +1,75 @@ +#!/usr/bin/env python3 +"""Extract dependencies from wheel METADATA file.""" + +import sys +import zipfile +import re +from pathlib import Path + + +def extract_dependencies(wheel_path): + """Extract Requires-Dist from wheel METADATA.""" + dependencies = [] + + try: + with zipfile.ZipFile(wheel_path, "r") as whl: + # Find METADATA file + metadata_files = [ + f for f in whl.namelist() if f.endswith(".dist-info/METADATA") + ] + + if not metadata_files: + print(f"Warning: No METADATA found in {wheel_path}", file=sys.stderr) + return dependencies + + metadata_content = whl.read(metadata_files[0]).decode("utf-8") + + # Parse Requires-Dist lines + for line in metadata_content.split("\n"): + line = line.strip() + if line.startswith("Requires-Dist:"): + # Extract dependency specification + dep = line.split(":", 1)[1].strip() + # Remove extras and environment markers + dep = re.split(r"\s*;\s*", dep)[0] + dep = re.split(r"\s*\[", dep)[0] + dependencies.append(dep) + + except Exception as e: + print(f"Error reading {wheel_path}: {e}", file=sys.stderr) + sys.exit(1) + + return dependencies + + +def main(): + if len(sys.argv) != 3: + print("Usage: extract_wheel_deps.py ", file=sys.stderr) + sys.exit(1) + + 
wheel_dir = Path(sys.argv[1]) + output_file = Path(sys.argv[2]) + + # Find fastsafetensors wheels + wheel_files = list(wheel_dir.glob("fastsafetensors-*.whl")) + + if not wheel_files: + print("Error: No fastsafetensors wheels found", file=sys.stderr) + sys.exit(1) + + # Use first wheel (all should have same dependencies) + wheel_path = wheel_files[0] + print(f"Extracting dependencies from: {wheel_path.name}", file=sys.stderr) + + deps = extract_dependencies(wheel_path) + + # Write dependencies to output file + with open(output_file, "w") as f: + for dep in deps: + f.write(dep + "\n") + + print(f"Extracted {len(deps)} dependencies to {output_file}", file=sys.stderr) + + +if __name__ == "__main__": + main() From 2b12a97cc40ebe690b4c1f0f656d54f2c0accf7e Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 06:01:11 +0000 Subject: [PATCH 39/48] only bundle the dependencies specified in the pyproject.toml Signed-off-by: tjtanaa --- .github/scripts/extract_wheel_deps.py | 111 +++++++++++++++--------- .github/workflows/publish-to-index.yaml | 42 +++++++-- 2 files changed, 107 insertions(+), 46 deletions(-) diff --git a/.github/scripts/extract_wheel_deps.py b/.github/scripts/extract_wheel_deps.py index 79eff27..f44dd94 100644 --- a/.github/scripts/extract_wheel_deps.py +++ b/.github/scripts/extract_wheel_deps.py @@ -1,42 +1,77 @@ #!/usr/bin/env python3 -"""Extract dependencies from wheel METADATA file.""" +"""Extract dependencies from pyproject.toml for a specific version.""" -import sys -import zipfile import re +import sys from pathlib import Path -def extract_dependencies(wheel_path): - """Extract Requires-Dist from wheel METADATA.""" +def parse_pyproject_toml(pyproject_path): + """Parse dependencies from pyproject.toml, excluding test dependencies.""" dependencies = [] try: - with zipfile.ZipFile(wheel_path, "r") as whl: - # Find METADATA file - metadata_files = [ - f for f in whl.namelist() if f.endswith(".dist-info/METADATA") - ] - - if not metadata_files: - print(f"Warning: No METADATA found in {wheel_path}", file=sys.stderr) - return dependencies - - metadata_content = whl.read(metadata_files[0]).decode("utf-8") - - # Parse Requires-Dist lines - for line in metadata_content.split("\n"): - line = line.strip() - if line.startswith("Requires-Dist:"): - # Extract dependency specification - dep = line.split(":", 1)[1].strip() - # Remove extras and environment markers - dep = re.split(r"\s*;\s*", dep)[0] - dep = re.split(r"\s*\[", dep)[0] - dependencies.append(dep) + with open(pyproject_path, "r") as f: + content = f.read() + + # Find [project.dependencies] section + in_dependencies = False + in_optional_dependencies = False + bracket_count = 0 + + for line in content.split("\n"): + line_stripped = line.strip() + + # Check if entering dependencies section + if line_stripped == "[project.dependencies]" or line_stripped.startswith( + "dependencies = [" + ): + in_dependencies = True + if "[" in line: + bracket_count = line.count("[") - line.count("]") + continue + + # Check if entering optional dependencies (skip these) + if ( + "[project.optional-dependencies]" in line_stripped + or "[tool.poetry.group" in line_stripped + ): + in_dependencies = False + in_optional_dependencies = True + continue + + # Exit sections when encountering new section header + if line_stripped.startswith("[") and line_stripped.endswith("]"): + in_dependencies = False + in_optional_dependencies = False + bracket_count = 0 + continue + + # Skip if in optional dependencies + if in_optional_dependencies: + continue + + 
# Parse dependency lines + if in_dependencies: + # Track bracket balance for multiline arrays + bracket_count += line.count("[") - line.count("]") + + # Extract dependency from quoted string + match = re.search(r'["\']([^"\']+)["\']', line) + if match: + dep = match.group(1).strip() + # Skip comments and empty lines + if dep and not dep.startswith("#"): + # Remove any trailing commas + dep = dep.rstrip(",").strip() + dependencies.append(dep) + + # Check if array is closed + if bracket_count == 0: + in_dependencies = False except Exception as e: - print(f"Error reading {wheel_path}: {e}", file=sys.stderr) + print(f"Error reading {pyproject_path}: {e}", file=sys.stderr) sys.exit(1) return dependencies @@ -44,24 +79,22 @@ def extract_dependencies(wheel_path): def main(): if len(sys.argv) != 3: - print("Usage: extract_wheel_deps.py ", file=sys.stderr) + print( + "Usage: extract_wheel_deps.py ", + file=sys.stderr, + ) sys.exit(1) - wheel_dir = Path(sys.argv[1]) + pyproject_path = Path(sys.argv[1]) output_file = Path(sys.argv[2]) - # Find fastsafetensors wheels - wheel_files = list(wheel_dir.glob("fastsafetensors-*.whl")) - - if not wheel_files: - print("Error: No fastsafetensors wheels found", file=sys.stderr) + if not pyproject_path.exists(): + print(f"Error: {pyproject_path} not found", file=sys.stderr) sys.exit(1) - # Use first wheel (all should have same dependencies) - wheel_path = wheel_files[0] - print(f"Extracting dependencies from: {wheel_path.name}", file=sys.stderr) + print(f"Extracting dependencies from: {pyproject_path}", file=sys.stderr) - deps = extract_dependencies(wheel_path) + deps = parse_pyproject_toml(pyproject_path) # Write dependencies to output file with open(output_file, "w") as f: diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index 89192f0..24dd104 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -133,23 +133,51 @@ jobs: cd ../.. fi - - name: Extract dependencies from wheels + - name: Extract dependencies from pyproject.toml run: | PLATFORM="${{ steps.determine.outputs.platform }}" VERSION="${{ steps.determine.outputs.version }}" + # Determine version tag for ROCm/CUDA + get_version_tag() { + local platform=$1 + local version="${VERSION}" + if [[ "${version}" == *"-${platform}"* ]]; then + echo "${version}" + else + echo "${version}-${platform}" + fi + } + extract_deps_for_platform() { local platform=$1 - local wheel_dir="wheels/${platform}" + local version_tag=$(get_version_tag "${platform}") local output_file="wheels/${platform}/requirements.txt" - if [ ! -d "${wheel_dir}" ]; then - echo "No wheels directory for ${platform}" - return + echo "Extracting dependencies for ${platform} from version ${version_tag}..." + + # Checkout the specific version tag to get its pyproject.toml + cd fastsafetensors-rocm + git fetch --tags + + if ! git checkout "${version_tag}" 2>/dev/null; then + echo "Warning: Could not checkout tag ${version_tag}, using current version" + git checkout - + fi + + # Check if pyproject.toml exists + if [ ! -f "pyproject.toml" ]; then + echo "Error: pyproject.toml not found for version ${version_tag}" + cd .. + return 1 fi - echo "Extracting dependencies from ${platform} wheels..." 
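Hand-rolling the pyproject.toml parsing as above keeps the script dependency-free on older Pythons; on Python 3.11+ the same extraction of `[project].dependencies` is a few lines with the stdlib `tomllib`. A sketch, not what the workflow ships:

```python
# Sketch: read runtime dependencies from pyproject.toml with stdlib tomllib (3.11+)
# and write one requirement per line, like the extraction step expects.
import sys
import tomllib
from pathlib import Path

def extract_runtime_deps(pyproject_path: str) -> list[str]:
    with open(pyproject_path, "rb") as f:
        data = tomllib.load(f)
    # Runtime deps only; optional-dependencies (test extras etc.) are ignored.
    return list(data.get("project", {}).get("dependencies", []))

if __name__ == "__main__":
    deps = extract_runtime_deps(sys.argv[1])
    Path(sys.argv[2]).write_text("\n".join(deps) + "\n")
    print(f"wrote {len(deps)} dependencies", file=sys.stderr)
```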
- python3 fastsafetensors-rocm/.github/scripts/extract_wheel_deps.py "${wheel_dir}" "${output_file}" + # Extract dependencies from pyproject.toml + python3 .github/scripts/extract_wheel_deps.py "pyproject.toml" "../${output_file}" + + # Return to original branch/commit + git checkout - + cd .. echo "Extracted dependencies:" cat "${output_file}" From f0ec845fda3098140c46361188bdcd03cdedd8a2 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 06:05:27 +0000 Subject: [PATCH 40/48] bugfix the workflow Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 18 ++++++++++++------ 1 file changed, 12 insertions(+), 6 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index 24dd104..b925025 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -138,6 +138,9 @@ jobs: PLATFORM="${{ steps.determine.outputs.platform }}" VERSION="${{ steps.determine.outputs.version }}" + # Save absolute path to the extraction script (from current checkout) + SCRIPT_PATH="$(pwd)/fastsafetensors-rocm/.github/scripts/extract_wheel_deps.py" + # Determine version tag for ROCm/CUDA get_version_tag() { local platform=$1 @@ -152,7 +155,7 @@ jobs: extract_deps_for_platform() { local platform=$1 local version_tag=$(get_version_tag "${platform}") - local output_file="wheels/${platform}/requirements.txt" + local output_file="$(pwd)/wheels/${platform}/requirements.txt" echo "Extracting dependencies for ${platform} from version ${version_tag}..." @@ -160,23 +163,26 @@ jobs: cd fastsafetensors-rocm git fetch --tags + # Save current commit + local current_ref=$(git rev-parse HEAD) + if ! git checkout "${version_tag}" 2>/dev/null; then echo "Warning: Could not checkout tag ${version_tag}, using current version" - git checkout - fi # Check if pyproject.toml exists if [ ! -f "pyproject.toml" ]; then echo "Error: pyproject.toml not found for version ${version_tag}" + git checkout "${current_ref}" cd .. return 1 fi - # Extract dependencies from pyproject.toml - python3 .github/scripts/extract_wheel_deps.py "pyproject.toml" "../${output_file}" + # Extract dependencies from pyproject.toml using script from current checkout + python3 "${SCRIPT_PATH}" "pyproject.toml" "${output_file}" - # Return to original branch/commit - git checkout - + # Return to original commit + git checkout "${current_ref}" cd .. 
echo "Extracted dependencies:" From 52910315c7f89feb86b3d7e3ba720a277e91cc8d Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 06:16:25 +0000 Subject: [PATCH 41/48] fixing the publsih to index workflow Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 18 ++++++++++++------ 1 file changed, 12 insertions(+), 6 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index b925025..a50ec4c 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -138,8 +138,14 @@ jobs: PLATFORM="${{ steps.determine.outputs.platform }}" VERSION="${{ steps.determine.outputs.version }}" - # Save absolute path to the extraction script (from current checkout) - SCRIPT_PATH="$(pwd)/fastsafetensors-rocm/.github/scripts/extract_wheel_deps.py" + # Get absolute paths + WORKSPACE_DIR="$(pwd)" + SCRIPT_PATH="${WORKSPACE_DIR}/fastsafetensors-rocm/.github/scripts/extract_wheel_deps.py" + REPO_DIR="${WORKSPACE_DIR}/fastsafetensors-rocm" + + echo "Workspace: ${WORKSPACE_DIR}" + echo "Script: ${SCRIPT_PATH}" + echo "Repo: ${REPO_DIR}" # Determine version tag for ROCm/CUDA get_version_tag() { @@ -155,12 +161,12 @@ jobs: extract_deps_for_platform() { local platform=$1 local version_tag=$(get_version_tag "${platform}") - local output_file="$(pwd)/wheels/${platform}/requirements.txt" + local output_file="${WORKSPACE_DIR}/wheels/${platform}/requirements.txt" echo "Extracting dependencies for ${platform} from version ${version_tag}..." # Checkout the specific version tag to get its pyproject.toml - cd fastsafetensors-rocm + cd "${REPO_DIR}" git fetch --tags # Save current commit @@ -174,7 +180,7 @@ jobs: if [ ! -f "pyproject.toml" ]; then echo "Error: pyproject.toml not found for version ${version_tag}" git checkout "${current_ref}" - cd .. + cd "${WORKSPACE_DIR}" return 1 fi @@ -183,7 +189,7 @@ jobs: # Return to original commit git checkout "${current_ref}" - cd .. 
+ cd "${WORKSPACE_DIR}" echo "Extracted dependencies:" cat "${output_file}" From 1f2e60c6a1d9a562db115f2c4b7803398db4dd1d Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 06:20:30 +0000 Subject: [PATCH 42/48] fixing the publsih to index workflow Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 14 ++++++++++---- 1 file changed, 10 insertions(+), 4 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index a50ec4c..77d0e7d 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -140,11 +140,14 @@ jobs: # Get absolute paths WORKSPACE_DIR="$(pwd)" - SCRIPT_PATH="${WORKSPACE_DIR}/fastsafetensors-rocm/.github/scripts/extract_wheel_deps.py" REPO_DIR="${WORKSPACE_DIR}/fastsafetensors-rocm" + # Copy script to temp location so it survives git checkout + TEMP_SCRIPT="/tmp/extract_wheel_deps_$$.py" + cp "${REPO_DIR}/.github/scripts/extract_wheel_deps.py" "${TEMP_SCRIPT}" + echo "Workspace: ${WORKSPACE_DIR}" - echo "Script: ${SCRIPT_PATH}" + echo "Temp script: ${TEMP_SCRIPT}" echo "Repo: ${REPO_DIR}" # Determine version tag for ROCm/CUDA @@ -184,8 +187,8 @@ jobs: return 1 fi - # Extract dependencies from pyproject.toml using script from current checkout - python3 "${SCRIPT_PATH}" "pyproject.toml" "${output_file}" + # Extract dependencies from pyproject.toml using script from temp location + python3 "${TEMP_SCRIPT}" "pyproject.toml" "${output_file}" # Return to original commit git checkout "${current_ref}" @@ -203,6 +206,9 @@ jobs: extract_deps_for_platform "cuda" fi + # Cleanup temp script + rm -f "${TEMP_SCRIPT}" + - name: Download all dependencies run: | PLATFORM="${{ steps.determine.outputs.platform }}" From bf274a1204d420b583dffc2e47fd72bb13bc96cb Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 06:26:20 +0000 Subject: [PATCH 43/48] update workflow instruction Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index 77d0e7d..60d68fc 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -4,17 +4,17 @@ on: workflow_dispatch: inputs: version: - description: 'Version to publish (e.g., v0.1.15-rocm or v0.1.15-cuda)' + description: 'Version to publish (e.g., v0.1.15)' required: true platform: description: 'Platform to publish (rocm, cuda, or both)' required: true - default: 'rocm' + default: 'both' type: choice options: + - both - rocm - cuda - - both release: types: [published] From c5b48868c2bd7cb4cde9b7fef71f1aabf49fd3e6 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Fri, 7 Nov 2025 20:21:01 +0000 Subject: [PATCH 44/48] only allow publish to index be triggered manually Signed-off-by: tjtanaa --- .github/workflows/publish-to-index.yaml | 25 ++++--------------------- 1 file changed, 4 insertions(+), 21 deletions(-) diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml index 60d68fc..1c5d9fb 100644 --- a/.github/workflows/publish-to-index.yaml +++ b/.github/workflows/publish-to-index.yaml @@ -15,8 +15,6 @@ on: - both - rocm - cuda - release: - types: [published] permissions: contents: write @@ -53,26 +51,11 @@ jobs: - name: Determine platform and version id: determine run: | - # Determine version - if [ "${{ github.event_name }}" = "release" ]; then - VERSION="${{ github.event.release.tag_name }}" - else - 
VERSION="${{ github.event.inputs.version }}" - fi - echo "version=${VERSION}" >> $GITHUB_OUTPUT + # Get version and platform from workflow inputs + VERSION="${{ github.event.inputs.version }}" + PLATFORM="${{ github.event.inputs.platform }}" - # Determine platform from version tag or input - if [ "${{ github.event_name }}" = "release" ]; then - if [[ "${VERSION}" == *"rocm"* ]]; then - PLATFORM="rocm" - elif [[ "${VERSION}" == *"cuda"* ]]; then - PLATFORM="cuda" - else - PLATFORM="both" - fi - else - PLATFORM="${{ github.event.inputs.platform }}" - fi + echo "version=${VERSION}" >> $GITHUB_OUTPUT echo "platform=${PLATFORM}" >> $GITHUB_OUTPUT echo "Publishing version: ${VERSION}" From d631e44705c40d872204f1d00c83ae60a0bc8dc8 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Mon, 10 Nov 2025 23:31:13 +0000 Subject: [PATCH 45/48] remove github workflow Signed-off-by: tjtanaa --- .github/scripts/extract_wheel_deps.py | 108 ------ .github/workflows/build-rocm-wheels.yaml | 192 ---------- .github/workflows/publish-to-index.yaml | 465 ----------------------- 3 files changed, 765 deletions(-) delete mode 100644 .github/scripts/extract_wheel_deps.py delete mode 100644 .github/workflows/build-rocm-wheels.yaml delete mode 100644 .github/workflows/publish-to-index.yaml diff --git a/.github/scripts/extract_wheel_deps.py b/.github/scripts/extract_wheel_deps.py deleted file mode 100644 index f44dd94..0000000 --- a/.github/scripts/extract_wheel_deps.py +++ /dev/null @@ -1,108 +0,0 @@ -#!/usr/bin/env python3 -"""Extract dependencies from pyproject.toml for a specific version.""" - -import re -import sys -from pathlib import Path - - -def parse_pyproject_toml(pyproject_path): - """Parse dependencies from pyproject.toml, excluding test dependencies.""" - dependencies = [] - - try: - with open(pyproject_path, "r") as f: - content = f.read() - - # Find [project.dependencies] section - in_dependencies = False - in_optional_dependencies = False - bracket_count = 0 - - for line in content.split("\n"): - line_stripped = line.strip() - - # Check if entering dependencies section - if line_stripped == "[project.dependencies]" or line_stripped.startswith( - "dependencies = [" - ): - in_dependencies = True - if "[" in line: - bracket_count = line.count("[") - line.count("]") - continue - - # Check if entering optional dependencies (skip these) - if ( - "[project.optional-dependencies]" in line_stripped - or "[tool.poetry.group" in line_stripped - ): - in_dependencies = False - in_optional_dependencies = True - continue - - # Exit sections when encountering new section header - if line_stripped.startswith("[") and line_stripped.endswith("]"): - in_dependencies = False - in_optional_dependencies = False - bracket_count = 0 - continue - - # Skip if in optional dependencies - if in_optional_dependencies: - continue - - # Parse dependency lines - if in_dependencies: - # Track bracket balance for multiline arrays - bracket_count += line.count("[") - line.count("]") - - # Extract dependency from quoted string - match = re.search(r'["\']([^"\']+)["\']', line) - if match: - dep = match.group(1).strip() - # Skip comments and empty lines - if dep and not dep.startswith("#"): - # Remove any trailing commas - dep = dep.rstrip(",").strip() - dependencies.append(dep) - - # Check if array is closed - if bracket_count == 0: - in_dependencies = False - - except Exception as e: - print(f"Error reading {pyproject_path}: {e}", file=sys.stderr) - sys.exit(1) - - return dependencies - - -def main(): - if len(sys.argv) != 3: - print( - "Usage: 
extract_wheel_deps.py ", - file=sys.stderr, - ) - sys.exit(1) - - pyproject_path = Path(sys.argv[1]) - output_file = Path(sys.argv[2]) - - if not pyproject_path.exists(): - print(f"Error: {pyproject_path} not found", file=sys.stderr) - sys.exit(1) - - print(f"Extracting dependencies from: {pyproject_path}", file=sys.stderr) - - deps = parse_pyproject_toml(pyproject_path) - - # Write dependencies to output file - with open(output_file, "w") as f: - for dep in deps: - f.write(dep + "\n") - - print(f"Extracted {len(deps)} dependencies to {output_file}", file=sys.stderr) - - -if __name__ == "__main__": - main() diff --git a/.github/workflows/build-rocm-wheels.yaml b/.github/workflows/build-rocm-wheels.yaml deleted file mode 100644 index 142ee78..0000000 --- a/.github/workflows/build-rocm-wheels.yaml +++ /dev/null @@ -1,192 +0,0 @@ -name: Build ROCm wheels - -on: - workflow_dispatch: - -jobs: - build-rocm-wheels: - name: Build ROCm wheel - Python ${{ matrix.python-version }} - runs-on: ubuntu-latest - container: - image: rocm/dev-ubuntu-24.04:7.0 - options: --user root - strategy: - fail-fast: false - matrix: - python-version: ["3.9", "3.10", "3.11", "3.12", "3.13"] - - steps: - - name: Checkout code - uses: actions/checkout@v4 - - - name: Install system dependencies - run: | - # Prevent interactive prompts during package installation - export DEBIAN_FRONTEND=noninteractive - export TZ=Etc/UTC - - apt-get update - apt-get install -y \ - software-properties-common \ - wget \ - build-essential \ - libnuma-dev \ - gcc \ - g++ \ - make \ - git \ - curl \ - ca-certificates \ - patchelf - - - name: Install Python ${{ matrix.python-version }} - run: | - # Prevent interactive prompts during package installation - export DEBIAN_FRONTEND=noninteractive - export TZ=Etc/UTC - - PY_VER="${{ matrix.python-version }}" - - # Check if Python dev package is available in Ubuntu repos - apt-get update - if apt-cache show python${PY_VER}-dev 2>/dev/null | grep -q "Package: python${PY_VER}-dev"; then - echo "Installing Python ${PY_VER} from Ubuntu repositories" - apt-get install -y \ - python${PY_VER} \ - python${PY_VER}-dev \ - python${PY_VER}-venv - else - # If not available in Ubuntu repos, install using pyenv - echo "Python ${PY_VER} not in Ubuntu repos, installing via pyenv from python.org" - - # Install pyenv dependencies - apt-get install -y \ - libssl-dev \ - zlib1g-dev \ - libbz2-dev \ - libreadline-dev \ - libsqlite3-dev \ - libncursesw5-dev \ - xz-utils \ - tk-dev \ - libxml2-dev \ - libxmlsec1-dev \ - libffi-dev \ - liblzma-dev - - # Install pyenv - export PYENV_ROOT="/root/.pyenv" - curl https://pyenv.run | bash - export PATH="$PYENV_ROOT/bin:$PATH" - eval "$(pyenv init -)" - - # Install Python from official python.org releases - pyenv install ${PY_VER} - pyenv global ${PY_VER} - - # Create symlink so python${PY_VER} command works - INSTALLED_VERSION=$(ls /root/.pyenv/versions/ | grep "^${PY_VER}") - ln -sf /root/.pyenv/versions/${INSTALLED_VERSION}/bin/python /usr/local/bin/python${PY_VER} - echo "Created symlink: /usr/local/bin/python${PY_VER} -> /root/.pyenv/versions/${INSTALLED_VERSION}/bin/python" - fi - - # Verify installation - python${PY_VER} --version - - - name: Create virtual environment and install build dependencies - run: | - PY_VER="${{ matrix.python-version }}" - - # Create virtual environment - python${PY_VER} -m venv /opt/venv - - # Activate venv and install dependencies - . 
/opt/venv/bin/activate - - # Upgrade pip and install build tools - python -m pip install --upgrade pip setuptools wheel - python -m pip install build setuptools_scm pybind11 numpy auditwheel - - # Verify - python --version - pip --version - - - name: Set ROCm environment variables - run: | - echo "ROCM_PATH=/opt/rocm" >> $GITHUB_ENV - echo "HIP_PATH=/opt/rocm/hip" >> $GITHUB_ENV - echo "/opt/rocm/bin" >> $GITHUB_PATH - echo "/opt/rocm/hip/bin" >> $GITHUB_PATH - echo "/opt/venv/bin" >> $GITHUB_PATH - - # Verify ROCm installation - ls -la /opt/rocm/ || echo "Warning: /opt/rocm not found" - hipify-perl --version || echo "Warning: hipify-perl not working" - - - name: Build wheel for ROCm - run: | - # Activate venv - . /opt/venv/bin/activate - - # The setup.py should detect ROCm and use hipify-perl automatically - python -m pip wheel . -w wheelhouse/ --no-deps -v - env: - ROCM_PATH: /opt/rocm - HIP_PATH: /opt/rocm/hip - - - name: List built wheels - run: | - ls -lah wheelhouse/ - - - name: Repair wheel with auditwheel to create manylinux wheel - run: | - # Activate venv - . /opt/venv/bin/activate - - # Use auditwheel to repair and convert to manylinux wheel - mkdir -p wheelhouse_repaired - for wheel in wheelhouse/*.whl; do - echo "Repairing wheel: $wheel" - auditwheel repair "$wheel" -w wheelhouse_repaired/ || { - echo "auditwheel repair failed, copying original wheel" - cp "$wheel" wheelhouse_repaired/ - } - done - - # Replace original wheelhouse with repaired wheels - rm -rf wheelhouse - mv wheelhouse_repaired wheelhouse - - echo "Repaired wheels:" - ls -lah wheelhouse/ - - - name: Upload wheel artifact - uses: actions/upload-artifact@v4 - with: - name: rocm-wheel-py${{ matrix.python-version }} - path: wheelhouse/*.whl - if-no-files-found: error - - collect-wheels: - name: Collect all ROCm wheels - needs: build-rocm-wheels - runs-on: ubuntu-latest - - steps: - - name: Download all wheel artifacts - uses: actions/download-artifact@v4 - with: - path: all-wheels/ - pattern: rocm-wheel-* - merge-multiple: true - - - name: List all wheels - run: | - echo "Built ROCm wheels:" - ls -lah all-wheels/ - - - name: Upload combined artifact - uses: actions/upload-artifact@v4 - with: - name: rocm-wheels-all - path: all-wheels/*.whl diff --git a/.github/workflows/publish-to-index.yaml b/.github/workflows/publish-to-index.yaml deleted file mode 100644 index 1c5d9fb..0000000 --- a/.github/workflows/publish-to-index.yaml +++ /dev/null @@ -1,465 +0,0 @@ -name: Publish wheels to custom index - -on: - workflow_dispatch: - inputs: - version: - description: 'Version to publish (e.g., v0.1.15)' - required: true - platform: - description: 'Platform to publish (rocm, cuda, or both)' - required: true - default: 'both' - type: choice - options: - - both - - rocm - - cuda - -permissions: - contents: write - -jobs: - publish-to-github-pages: - name: Publish to GitHub Pages index - runs-on: ubuntu-latest - - steps: - - name: Checkout fastsafetensors-rocm repo - uses: actions/checkout@v4 - with: - path: fastsafetensors-rocm - - - name: Set up Python - uses: actions/setup-python@v5 - with: - python-version: "3.12" - - - name: Install tools - run: | - python -m pip install --upgrade pip - pip install dumb-pypi - - # Install GitHub CLI - type -p curl >/dev/null || (sudo apt update && sudo apt install curl -y) - curl -fsSL https://cli.github.com/packages/githubcli-archive-keyring.gpg | sudo dd of=/usr/share/keyrings/githubcli-archive-keyring.gpg \ - && sudo chmod go+r /usr/share/keyrings/githubcli-archive-keyring.gpg \ - && 
echo "deb [arch=$(dpkg --print-architecture) signed-by=/usr/share/keyrings/githubcli-archive-keyring.gpg] https://cli.github.com/packages stable main" | sudo tee /etc/apt/sources.list.d/github-cli.list > /dev/null \ - && sudo apt update \ - && sudo apt install gh -y - - - name: Determine platform and version - id: determine - run: | - # Get version and platform from workflow inputs - VERSION="${{ github.event.inputs.version }}" - PLATFORM="${{ github.event.inputs.platform }}" - - echo "version=${VERSION}" >> $GITHUB_OUTPUT - echo "platform=${PLATFORM}" >> $GITHUB_OUTPUT - - echo "Publishing version: ${VERSION}" - echo "Platform: ${PLATFORM}" - - - name: Download wheels from release - env: - GH_TOKEN: ${{ github.token }} - run: | - VERSION="${{ steps.determine.outputs.version }}" - PLATFORM="${{ steps.determine.outputs.platform }}" - - # Function to construct platform-specific version tag - get_version_tag() { - local platform=$1 - local version="${VERSION}" - - # If version already has platform suffix, use as-is - if [[ "${version}" == *"-${platform}"* ]]; then - echo "${version}" - else - # Otherwise append platform suffix - echo "${version}-${platform}" - fi - } - - # Download ROCm wheels - if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then - ROCM_VERSION=$(get_version_tag "rocm") - mkdir -p wheels/rocm - echo "Downloading ROCm wheels from release ${ROCM_VERSION}" - cd wheels/rocm - if ! gh release download "${ROCM_VERSION}" \ - --repo EmbeddedLLM/fastsafetensors-rocm \ - --pattern "*.whl"; then - echo "ERROR: Failed to download ROCm wheels from ${ROCM_VERSION}" - exit 1 - fi - echo "Downloaded wheels:" - ls -lah - cd ../.. - fi - - # Download CUDA wheels - if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then - CUDA_VERSION=$(get_version_tag "cuda") - mkdir -p wheels/cuda - echo "Downloading CUDA wheels from release ${CUDA_VERSION}" - cd wheels/cuda - if ! gh release download "${CUDA_VERSION}" \ - --repo EmbeddedLLM/fastsafetensors-rocm \ - --pattern "*.whl"; then - echo "ERROR: Failed to download CUDA wheels from ${CUDA_VERSION}" - exit 1 - fi - echo "Downloaded wheels:" - ls -lah - cd ../.. - fi - - - name: Extract dependencies from pyproject.toml - run: | - PLATFORM="${{ steps.determine.outputs.platform }}" - VERSION="${{ steps.determine.outputs.version }}" - - # Get absolute paths - WORKSPACE_DIR="$(pwd)" - REPO_DIR="${WORKSPACE_DIR}/fastsafetensors-rocm" - - # Copy script to temp location so it survives git checkout - TEMP_SCRIPT="/tmp/extract_wheel_deps_$$.py" - cp "${REPO_DIR}/.github/scripts/extract_wheel_deps.py" "${TEMP_SCRIPT}" - - echo "Workspace: ${WORKSPACE_DIR}" - echo "Temp script: ${TEMP_SCRIPT}" - echo "Repo: ${REPO_DIR}" - - # Determine version tag for ROCm/CUDA - get_version_tag() { - local platform=$1 - local version="${VERSION}" - if [[ "${version}" == *"-${platform}"* ]]; then - echo "${version}" - else - echo "${version}-${platform}" - fi - } - - extract_deps_for_platform() { - local platform=$1 - local version_tag=$(get_version_tag "${platform}") - local output_file="${WORKSPACE_DIR}/wheels/${platform}/requirements.txt" - - echo "Extracting dependencies for ${platform} from version ${version_tag}..." - - # Checkout the specific version tag to get its pyproject.toml - cd "${REPO_DIR}" - git fetch --tags - - # Save current commit - local current_ref=$(git rev-parse HEAD) - - if ! 
git checkout "${version_tag}" 2>/dev/null; then - echo "Warning: Could not checkout tag ${version_tag}, using current version" - fi - - # Check if pyproject.toml exists - if [ ! -f "pyproject.toml" ]; then - echo "Error: pyproject.toml not found for version ${version_tag}" - git checkout "${current_ref}" - cd "${WORKSPACE_DIR}" - return 1 - fi - - # Extract dependencies from pyproject.toml using script from temp location - python3 "${TEMP_SCRIPT}" "pyproject.toml" "${output_file}" - - # Return to original commit - git checkout "${current_ref}" - cd "${WORKSPACE_DIR}" - - echo "Extracted dependencies:" - cat "${output_file}" - } - - if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then - extract_deps_for_platform "rocm" - fi - - if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then - extract_deps_for_platform "cuda" - fi - - # Cleanup temp script - rm -f "${TEMP_SCRIPT}" - - - name: Download all dependencies - run: | - PLATFORM="${{ steps.determine.outputs.platform }}" - - # Function to download dependencies for a platform - download_deps() { - local platform=$1 - local dest_dir="wheels/${platform}" - local req_file="${dest_dir}/requirements.txt" - - echo "Downloading dependencies for ${platform}..." - - if [ ! -f "${req_file}" ]; then - echo "No requirements file found for ${platform}, skipping" - return - fi - - # For each Python version, download dependencies - for py_ver in 3.9 3.10 3.11 3.12 3.13; do - echo "Downloading dependencies for Python ${py_ver}" - - # Download dependencies using extracted requirements - python -m pip download \ - --dest "${dest_dir}" \ - --only-binary :all: \ - --python-version ${py_ver} \ - --platform manylinux2014_x86_64 \ - --platform manylinux_2_17_x86_64 \ - --platform manylinux_2_27_x86_64 \ - --platform manylinux_2_28_x86_64 \ - -r "${req_file}" 2>/dev/null || echo "Some downloads failed for Python ${py_ver}" - done - - # Also download using current Python for any missing wheels - python -m pip download \ - --dest "${dest_dir}" \ - --only-binary :all: \ - -r "${req_file}" || true - - # Summary - if [ -d "${dest_dir}" ] && [ "$(ls -A ${dest_dir}/*.whl 2>/dev/null)" ]; then - echo "Total wheels collected for ${platform}:" - ls -1 "${dest_dir}"/*.whl | wc -l - - echo "Wheel breakdown by package:" - ls -1 "${dest_dir}"/*.whl | xargs -n1 basename | sed 's/-[0-9].*//' | sort | uniq -c - fi - } - - # Download for requested platforms - if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then - download_deps "rocm" - fi - - if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then - download_deps "cuda" - fi - - - name: Checkout GitHub Pages repository - uses: actions/checkout@v4 - with: - repository: EmbeddedLLM/fastsafetensors-rocm - ref: gh-pages - token: ${{ secrets.GITHUB_TOKEN }} - path: gh-pages-repo - - - name: Copy wheels and generate index - run: | - cd gh-pages-repo - PLATFORM="${{ steps.determine.outputs.platform }}" - VERSION="${{ steps.determine.outputs.version }}" - - # Function to generate index for a platform - generate_index() { - local platform=$1 - local version="${VERSION}" - - echo "Generating index for ${platform}..." 
- - # Clean up old index files to avoid conflicts - rm -rf "${platform}/simple" - rm -f "${platform}/package-list.txt" - rm -f "${platform}/index.html" - rm -f "${platform}/packages.json" - - # Create directory structure - mkdir -p "${platform}/packages" - mkdir -p "${platform}/manifests" - - # Copy all wheels - if [ -d "../wheels/${platform}" ] && [ "$(ls -A ../wheels/${platform}/*.whl 2>/dev/null)" ]; then - # Extract version number (remove 'v' prefix if present) - local clean_version="${version#v}" - - # Remove OLD wheels for the SAME version only - echo "Removing old fastsafetensors-${clean_version} wheels..." - rm -f "${platform}/packages/fastsafetensors-${clean_version}"-*.whl || true - - # Copy new wheels - echo "Copying new wheels..." - cp ../wheels/${platform}/*.whl "${platform}/packages/" - - # Generate package list with just filenames (dumb-pypi doesn't accept paths with /) - (cd "${platform}/packages" && ls *.whl) > "${platform}/package-list.txt" - - echo "Package list contents:" - cat "${platform}/package-list.txt" - - # Create manifest for this version - echo "Creating manifest for version ${clean_version}..." - local manifest_file="${platform}/manifests/v${clean_version}.json" - - # Read dependencies from requirements.txt - local deps_json="[]" - if [ -f "../wheels/${platform}/requirements.txt" ]; then - deps_json=$(python3 -c 'import json,sys; print(json.dumps([line.strip() for line in open("../wheels/'${platform}'/requirements.txt") if line.strip() and not line.startswith("#")]))') - fi - - # List fastsafetensors wheels - local fst_wheels_json=$(cd "${platform}/packages" && python3 -c 'import json,glob; print(json.dumps(sorted(glob.glob("fastsafetensors-'${clean_version}'-*.whl"))))') - - # List all downloaded wheels - local all_wheels_json=$(cd "${platform}/packages" && python3 -c 'import json,glob; print(json.dumps(sorted(glob.glob("*.whl"))))') - - # Create manifest JSON using Python - python3 -c "import json,sys; manifest={'fastsafetensors_version':'${clean_version}','published_at':'$(date -u +%Y-%m-%dT%H:%M:%SZ)','platform':'${platform}','dependencies':${deps_json},'fastsafetensors_wheels':${fst_wheels_json},'total_wheels_in_index':len(${all_wheels_json})}; json.dump(manifest,open('${manifest_file}','w'),indent=2)" - - echo "Created manifest:" - cat "${manifest_file}" - - # Generate PEP 503 compliant index - # Note: dumb-pypi expects wheel files to be accessible from where it runs - # Run from packages/ directory so dumb-pypi can find the wheels by filename - # packages-url is relative from simple/fastsafetensors/ to packages/: ../../packages - (cd "${platform}/packages" && \ - dumb-pypi \ - --package-list ../package-list.txt \ - --packages-url ../../packages \ - --output-dir .. 
\ - --title "fastsafetensors ${platform^^} Index") - - echo "Generated ${platform} index for $(ls ${platform}/packages/*.whl | wc -l) wheels" - - # Debug: show generated structure - echo "Generated structure:" - ls -la "${platform}/simple/" || echo "No simple/ directory created" - ls -la "${platform}/simple/fastsafetensors/" || echo "No fastsafetensors/ directory created" - else - echo "No wheels found for ${platform}, skipping index generation" - fi - } - - # Generate for requested platforms - if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then - generate_index "rocm" - fi - - if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then - generate_index "cuda" - fi - - - name: Create index READMEs - run: | - cd gh-pages-repo - PLATFORM="${{ steps.determine.outputs.platform }}" - - # Function to create README for a platform - create_readme() { - local platform=$1 - local platform_upper=$(echo $platform | tr '[:lower:]' '[:upper:]') - - if [ ! -d "${platform}/packages" ] || [ ! "$(ls -A ${platform}/packages/*.whl 2>/dev/null)" ]; then - echo "No packages for ${platform}, skipping README" - return - fi - - cat > "${platform}/README.md" << EOF - # fastsafetensors ${platform_upper} Package Index - - This is a custom Python package index for ${platform_upper}-built fastsafetensors wheels. - - ## Installation - - \`\`\`bash - # Install fastsafetensors with ${platform_upper} support - pip install fastsafetensors --index-url https://embeddedllm.github.io/fastsafetensors-rocm/${platform}/simple/ - \`\`\` - - ## Available Packages - - This index includes: - - \`fastsafetensors\` - ${platform_upper} builds for Python 3.9-3.13 - - All dependencies (typer, click, etc.) for multiple Python versions and platforms - - ## What's Included - - EOF - - # List packages with counts - echo "### Package Inventory" >> "${platform}/README.md" - echo "" >> "${platform}/README.md" - ls "${platform}/packages"/*.whl | sed 's/.*\///' | sed 's/-[0-9].*//' | sort | uniq -c | awk '{print "- " $2 ": " $1 " wheels"}' >> "${platform}/README.md" - } - - # Create READMEs for requested platforms - if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then - create_readme "rocm" - fi - - if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then - create_readme "cuda" - fi - - - name: Commit and push to gh-pages - run: | - cd gh-pages-repo - PLATFORM="${{ steps.determine.outputs.platform }}" - - git config user.name "GitHub Actions" - git config user.email "actions@github.com" - - # Add platform directories based on selection - if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then - git add rocm/ - fi - - if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then - git add cuda/ - fi - - if git diff --staged --quiet; then - echo "No changes to commit" - else - if [ "$PLATFORM" = "both" ]; then - git commit -m "Update ROCm and CUDA indices - $(date +%Y-%m-%d)" - elif [ "$PLATFORM" = "cuda" ]; then - git commit -m "Update CUDA index - $(date +%Y-%m-%d)" - else - git commit -m "Update ROCm index - $(date +%Y-%m-%d)" - fi - git push - echo "Successfully pushed to gh-pages branch" - fi - - - name: Summary - run: | - PLATFORM="${{ steps.determine.outputs.platform }}" - - echo "## Published to GitHub Pages! 
🎉" >> $GITHUB_STEP_SUMMARY - echo "" >> $GITHUB_STEP_SUMMARY - - if [ "$PLATFORM" = "rocm" ] || [ "$PLATFORM" = "both" ]; then - echo "### ROCm Index" >> $GITHUB_STEP_SUMMARY - echo "Index URL: https://embeddedllm.github.io/fastsafetensors-rocm/rocm/simple/" >> $GITHUB_STEP_SUMMARY - echo "" >> $GITHUB_STEP_SUMMARY - echo "**Installation:**" >> $GITHUB_STEP_SUMMARY - echo '```bash' >> $GITHUB_STEP_SUMMARY - echo "pip install fastsafetensors --index-url https://embeddedllm.github.io/fastsafetensors-rocm/rocm/simple/" >> $GITHUB_STEP_SUMMARY - echo '```' >> $GITHUB_STEP_SUMMARY - echo "" >> $GITHUB_STEP_SUMMARY - fi - - if [ "$PLATFORM" = "cuda" ] || [ "$PLATFORM" = "both" ]; then - echo "### CUDA Index" >> $GITHUB_STEP_SUMMARY - echo "Index URL: https://embeddedllm.github.io/fastsafetensors-rocm/cuda/simple/" >> $GITHUB_STEP_SUMMARY - echo "" >> $GITHUB_STEP_SUMMARY - echo "**Installation:**" >> $GITHUB_STEP_SUMMARY - echo '```bash' >> $GITHUB_STEP_SUMMARY - echo "pip install fastsafetensors --index-url https://embeddedllm.github.io/fastsafetensors-rocm/cuda/simple/" >> $GITHUB_STEP_SUMMARY - echo '```' >> $GITHUB_STEP_SUMMARY - fi From e353538e433673fc1380de4477e718f700dc3c6a Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Mon, 10 Nov 2025 23:55:51 +0000 Subject: [PATCH 46/48] update installation procedure on ROCm Signed-off-by: tjtanaa --- README.md | 12 +++++++++--- 1 file changed, 9 insertions(+), 3 deletions(-) diff --git a/README.md b/README.md index c692e10..e50d967 100644 --- a/README.md +++ b/README.md @@ -66,11 +66,17 @@ pip install . ## For ROCm -### Install from source - On ROCm, there are not GDS equivalent support. So fastsafetensors support only supports `nogds=True` mode. The performance gain example can be found at [amd-perf.md](./docs/amd-perf.md) +### Install from Github Source + ```bash -python3 setup.py develop +python3 -m pip install git+https://github.com/foundation-model-stack/fastsafetensors.git +``` + +### Install from source + +```bash +pip install . 
``` From 8fd8b99c04b939edf02ae98844e6b1a5e832dd80 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Mon, 10 Nov 2025 23:56:23 +0000 Subject: [PATCH 47/48] fix installation command Signed-off-by: tjtanaa --- README.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/README.md b/README.md index e50d967..4d58823 100644 --- a/README.md +++ b/README.md @@ -72,7 +72,7 @@ The performance gain example can be found at [amd-perf.md](./docs/amd-perf.md) ### Install from Github Source ```bash -python3 -m pip install git+https://github.com/foundation-model-stack/fastsafetensors.git +pip install git+https://github.com/foundation-model-stack/fastsafetensors.git ``` ### Install from source From 82fba39009f96d5469a38d79f15f866e7fe99d09 Mon Sep 17 00:00:00 2001 From: tjtanaa Date: Tue, 11 Nov 2025 06:48:36 +0000 Subject: [PATCH 48/48] fix enum for HIP Signed-off-by: tjtanaa --- fastsafetensors/cpp/ext.hpp | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/fastsafetensors/cpp/ext.hpp b/fastsafetensors/cpp/ext.hpp index 961011f..770d3a1 100644 --- a/fastsafetensors/cpp/ext.hpp +++ b/fastsafetensors/cpp/ext.hpp @@ -39,7 +39,12 @@ typedef struct CUfileError { CUfileOpError err; } CUfileError_t; // Define minimal CUDA/HIP types for both platforms to avoid compile-time dependencies // We load all GPU functions dynamically at runtime via dlopen() typedef enum cudaError { cudaSuccess = 0, cudaErrorMemoryAllocation = 2 } cudaError_t; +// Platform-specific enum values - CUDA and HIP have different values for HostToDevice +#ifdef USE_ROCM +enum cudaMemcpyKind { cudaMemcpyHostToDevice=1, cudaMemcpyDefault = 4 }; +#else enum cudaMemcpyKind { cudaMemcpyHostToDevice=2, cudaMemcpyDefault = 4 }; +#endif typedef enum CUfileFeatureFlags {
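
Note on usage after installation: the README changes in the patches above only cover installing the package on ROCm. Below is a minimal smoke-test sketch of the `nogds=True` path those patches describe. It assumes the upstream fastsafetensors Python API (`SafeTensorsFileLoader`, `SingleGroup`, `add_filenames`, `copy_files_to_device`) and a locally available `model.safetensors` file containing a tensor named `weight`; exact parameter names and signatures may differ between versions, so treat this as illustration rather than the project's canonical example.

```python
# Minimal sketch: load a safetensors file on a ROCm GPU with nogds=True.
# Assumes fastsafetensors is installed (see README patches above) and that
# "model.safetensors" exists in the current directory; names are illustrative.
import torch
from fastsafetensors import SafeTensorsFileLoader, SingleGroup

device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")

# GDS has no ROCm equivalent, so force the nogds code path.
loader = SafeTensorsFileLoader(SingleGroup(), device, nogds=True, debug_log=True)
loader.add_filenames({0: ["model.safetensors"]})  # rank -> list of files

bufs = loader.copy_files_to_device()
try:
    # Replace "weight" with a tensor name that actually exists in the file.
    tensor = bufs.get_tensor(tensor_name="weight")
    print(tensor.shape, tensor.dtype, tensor.device)
finally:
    bufs.close()
    loader.close()
```

On a ROCm build of PyTorch, `torch.cuda.is_available()` returns True for HIP devices, so the `cuda:0` device string above maps to the AMD GPU.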