122 lines
3.7 KiB
Nix
122 lines
3.7 KiB
Nix
{
|
|
lib,
|
|
stdenv,
|
|
buildPythonPackage,
|
|
fetchFromGitHub,
|
|
pythonAtLeast,
|
|
|
|
# build-system
|
|
setuptools,
|
|
setuptools-scm,
|
|
llvmPackages,
|
|
|
|
# dependencies
|
|
frozendict,
|
|
loguru,
|
|
pydantic,
|
|
torch,
|
|
transformers,
|
|
|
|
# tests
|
|
nbconvert,
|
|
nbformat,
|
|
pytestCheckHook,
|
|
}:
|
|
|
|
buildPythonPackage (finalAttrs: {
|
|
pname = "compressed-tensors";
|
|
version = "0.14.0";
|
|
pyproject = true;
|
|
|
|
# Release on PyPI is missing the `utils` directory, which `setup.py` wants to import
|
|
src = fetchFromGitHub {
|
|
owner = "neuralmagic";
|
|
repo = "compressed-tensors";
|
|
tag = finalAttrs.version;
|
|
hash = "sha256-auiVCTL4WpfaD2cwdG3kt08+nW77T/txWZP4SAW00mk=";
|
|
};
|
|
|
|
postPatch = ''
|
|
substituteInPlace pyproject.toml \
|
|
--replace-fail "setuptools_scm==8.2.0" "setuptools_scm"
|
|
'';
|
|
|
|
build-system = [
|
|
setuptools
|
|
setuptools-scm
|
|
];
|
|
|
|
buildInputs = lib.optional stdenv.cc.isClang llvmPackages.openmp;
|
|
|
|
dependencies = [
|
|
frozendict
|
|
loguru
|
|
pydantic
|
|
torch
|
|
transformers
|
|
];
|
|
|
|
pythonRelaxDeps = [ "transformers" ];
|
|
|
|
doCheck = true;
|
|
|
|
pythonImportsCheck = [ "compressed_tensors" ];
|
|
|
|
nativeCheckInputs = [
|
|
nbconvert
|
|
nbformat
|
|
pytestCheckHook
|
|
];
|
|
|
|
disabledTests = [
|
|
# these try to download models from HF Hub
|
|
"test_apply_tinyllama_dynamic_activations"
|
|
"test_compress_model"
|
|
"test_compress_model_meta"
|
|
"test_compressed_linear_from_linear_usage"
|
|
"test_decompress_model"
|
|
"test_get_observer_token_count"
|
|
"test_kv_cache_quantization"
|
|
"test_load_compressed_sharded"
|
|
"test_model_forward_pass"
|
|
"test_save_compressed_model"
|
|
"test_target_prioritization"
|
|
"test_expand_targets_with_llama_stories"
|
|
|
|
# AssertionError: Torch not compiled with CUDA enabled
|
|
"test_register_parameter"
|
|
"test_register_parameter_invalidates"
|
|
"test_set_item"
|
|
"test_set_item_buffers"
|
|
"test_update_offload_parameter_with_grad"
|
|
];
|
|
|
|
disabledTestPaths = [
|
|
# these try to download models from HF Hub
|
|
"tests/test_quantization/lifecycle/test_apply.py"
|
|
# RuntimeError: The weights trying to be saved contained shared tensors
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[True-hadamard]"
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[True-random-hadamard]"
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[False-hadamard]"
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[False-random-hadamard]"
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[False-True-hadamard]"
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[False-True-random-hadamard]"
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[False-False-hadamard]"
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[False-False-random-hadamard]"
|
|
|
|
# AssertionError: Torch not compiled with CUDA enabled
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[True-True-hadamard]"
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[True-True-random-hadamard]"
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[True-False-hadamard]"
|
|
"tests/test_transform/factory/test_serialization.py::test_serialization[True-False-random-hadamard]"
|
|
];
|
|
|
|
meta = {
|
|
description = "Safetensors extension to efficiently store sparse quantized tensors on disk";
|
|
homepage = "https://github.com/neuralmagic/compressed-tensors";
|
|
changelog = "https://github.com/neuralmagic/compressed-tensors/releases/tag/${finalAttrs.src.tag}";
|
|
license = lib.licenses.asl20;
|
|
maintainers = with lib.maintainers; [ sarahec ];
|
|
};
|
|
})
|