LICENSE
MANIFEST.in
README.md
requirements.txt
setup.py
gptqmodel/__init__.py
gptqmodel/version.py
gptqmodel.egg-info/PKG-INFO
gptqmodel.egg-info/SOURCES.txt
gptqmodel.egg-info/dependency_links.txt
gptqmodel.egg-info/requires.txt
gptqmodel.egg-info/top_level.txt
gptqmodel/adapter/__init__.py
gptqmodel/adapter/adapter.py
gptqmodel/adapter/peft.py
gptqmodel/adapter/remote.py
gptqmodel/eora/__init__.py
gptqmodel/eora/eora.py
gptqmodel/looper/__init__.py
gptqmodel/looper/dequantize_processor.py
gptqmodel/looper/eora_processor.py
gptqmodel/looper/gptq_processor.py
gptqmodel/looper/input_cache.py
gptqmodel/looper/loop_processor.py
gptqmodel/looper/module_looper.py
gptqmodel/looper/named_module.py
gptqmodel/looper/qqq_processor.py
gptqmodel/models/__init__.py
gptqmodel/models/_const.py
gptqmodel/models/auto.py
gptqmodel/models/base.py
gptqmodel/models/loader.py
gptqmodel/models/writer.py
gptqmodel/models/definitions/__init__.py
gptqmodel/models/definitions/baichuan.py
gptqmodel/models/definitions/bloom.py
gptqmodel/models/definitions/chatglm.py
gptqmodel/models/definitions/codegen.py
gptqmodel/models/definitions/cohere.py
gptqmodel/models/definitions/cohere2.py
gptqmodel/models/definitions/dbrx.py
gptqmodel/models/definitions/dbrx_converted.py
gptqmodel/models/definitions/decilm.py
gptqmodel/models/definitions/deepseek_v2.py
gptqmodel/models/definitions/deepseek_v3.py
gptqmodel/models/definitions/exaone.py
gptqmodel/models/definitions/gemma.py
gptqmodel/models/definitions/gemma2.py
gptqmodel/models/definitions/gemma3.py
gptqmodel/models/definitions/glm.py
gptqmodel/models/definitions/gpt2.py
gptqmodel/models/definitions/gpt_bigcode.py
gptqmodel/models/definitions/gpt_neox.py
gptqmodel/models/definitions/gptj.py
gptqmodel/models/definitions/granite.py
gptqmodel/models/definitions/grinmoe.py
gptqmodel/models/definitions/hymba.py
gptqmodel/models/definitions/instella.py
gptqmodel/models/definitions/internlm.py
gptqmodel/models/definitions/internlm2.py
gptqmodel/models/definitions/llama.py
gptqmodel/models/definitions/longllama.py
gptqmodel/models/definitions/minicpm.py
gptqmodel/models/definitions/minicpm3.py
gptqmodel/models/definitions/mistral.py
gptqmodel/models/definitions/mixtral.py
gptqmodel/models/definitions/mllama.py
gptqmodel/models/definitions/mobilellm.py
gptqmodel/models/definitions/moss.py
gptqmodel/models/definitions/mpt.py
gptqmodel/models/definitions/olmo2.py
gptqmodel/models/definitions/opt.py
gptqmodel/models/definitions/ovis.py
gptqmodel/models/definitions/phi.py
gptqmodel/models/definitions/phi3.py
gptqmodel/models/definitions/qwen.py
gptqmodel/models/definitions/qwen2.py
gptqmodel/models/definitions/qwen2_moe.py
gptqmodel/models/definitions/qwen2_vl.py
gptqmodel/models/definitions/rw.py
gptqmodel/models/definitions/stablelmepoch.py
gptqmodel/models/definitions/starcoder2.py
gptqmodel/models/definitions/telechat2.py
gptqmodel/models/definitions/xverse.py
gptqmodel/models/definitions/yi.py
gptqmodel/nn_modules/__init__.py
gptqmodel/nn_modules/hooked_linear.py
gptqmodel/nn_modules/qlinear/__init__.py
gptqmodel/nn_modules/qlinear/bitblas.py
gptqmodel/nn_modules/qlinear/bitblas_target_detector.py
gptqmodel/nn_modules/qlinear/exllama.py
gptqmodel/nn_modules/qlinear/exllama_eora.py
gptqmodel/nn_modules/qlinear/exllamav2.py
gptqmodel/nn_modules/qlinear/ipex.py
gptqmodel/nn_modules/qlinear/marlin.py
gptqmodel/nn_modules/qlinear/qqq.py
gptqmodel/nn_modules/qlinear/torch.py
gptqmodel/nn_modules/qlinear/tritonv2.py
gptqmodel/nn_modules/qlinear/utils.py
gptqmodel/nn_modules/triton_utils/__init__.py
gptqmodel/nn_modules/triton_utils/custom_autotune.py
gptqmodel/nn_modules/triton_utils/dequant.py
gptqmodel/nn_modules/triton_utils/kernels.py
gptqmodel/nn_modules/triton_utils/mixin.py
gptqmodel/quantization/__init__.py
gptqmodel/quantization/config.py
gptqmodel/quantization/gptq.py
gptqmodel/quantization/qqq.py
gptqmodel/quantization/quantizer.py
gptqmodel/quantization/rotation/__init__.py
gptqmodel/quantization/rotation/hadamard_utils.py
gptqmodel/quantization/rotation/rotation.py
gptqmodel/utils/__init__.py
gptqmodel/utils/backend.py
gptqmodel/utils/bitblas.py
gptqmodel/utils/calibration.py
gptqmodel/utils/data.py
gptqmodel/utils/device.py
gptqmodel/utils/eval.py
gptqmodel/utils/evalplus.py
gptqmodel/utils/exllama.py
gptqmodel/utils/hf.py
gptqmodel/utils/image.py
gptqmodel/utils/importer.py
gptqmodel/utils/logger.py
gptqmodel/utils/marlin.py
gptqmodel/utils/mlx.py
gptqmodel/utils/mmlupro.py
gptqmodel/utils/model.py
gptqmodel/utils/openai_server.py
gptqmodel/utils/perplexity.py
gptqmodel/utils/plotly.py
gptqmodel/utils/rocm.py
gptqmodel/utils/safetensor.py
gptqmodel/utils/sglang.py
gptqmodel/utils/tensor.py
gptqmodel/utils/terminal.py
gptqmodel/utils/torch.py
gptqmodel/utils/vllm.py
gptqmodel/utils/vram.py
gptqmodel_ext/exllama/cu_compat.cuh
gptqmodel_ext/exllama/cuda_buffers.cu
gptqmodel_ext/exllama/cuda_buffers.cuh
gptqmodel_ext/exllama/exllama_ext.cpp
gptqmodel_ext/exllama/hip_compat.cuh
gptqmodel_ext/exllama/matrix.cuh
gptqmodel_ext/exllama/tuning.h
gptqmodel_ext/exllama/util.cuh
gptqmodel_ext/exllama/cuda_func/column_remap.cu
gptqmodel_ext/exllama/cuda_func/column_remap.cuh
gptqmodel_ext/exllama/cuda_func/q4_matmul.cu
gptqmodel_ext/exllama/cuda_func/q4_matmul.cuh
gptqmodel_ext/exllama/cuda_func/q4_matrix.cu
gptqmodel_ext/exllama/cuda_func/q4_matrix.cuh
gptqmodel_ext/exllama_eora/benchmark.py
gptqmodel_ext/exllama_eora/setup.py
gptqmodel_ext/exllama_eora/test_actual_value.py
gptqmodel_ext/exllama_eora/test_eora.py
gptqmodel_ext/exllama_eora/test_eora_sweep.py
gptqmodel_ext/exllama_eora/eora/__init__.py
gptqmodel_ext/exllama_eora/eora/compat.cuh
gptqmodel_ext/exllama_eora/eora/matrix_view.cuh
gptqmodel_ext/exllama_eora/eora/ops.h
gptqmodel_ext/exllama_eora/eora/pybind.cu
gptqmodel_ext/exllama_eora/eora/q_gemm.cu
gptqmodel_ext/exllama_eora/eora/q_gemm_original.cu
gptqmodel_ext/exllama_eora/eora/qdq_2.cuh
gptqmodel_ext/exllama_eora/eora/qdq_3.cuh
gptqmodel_ext/exllama_eora/eora/qdq_4.cuh
gptqmodel_ext/exllama_eora/eora/qdq_8.cuh
gptqmodel_ext/exllama_eora/eora/qdq_util.cuh
gptqmodel_ext/exllamav2/config.h
gptqmodel_ext/exllamav2/ext.cpp
gptqmodel_ext/exllamav2/cpp/util.h
gptqmodel_ext/exllamav2/cuda/compat.cuh
gptqmodel_ext/exllamav2/cuda/compat_gemm.cuh
gptqmodel_ext/exllamav2/cuda/matrix_view.cuh
gptqmodel_ext/exllamav2/cuda/q_gemm.cu
gptqmodel_ext/exllamav2/cuda/q_gemm.cuh
gptqmodel_ext/exllamav2/cuda/q_gemm_kernel.cuh
gptqmodel_ext/exllamav2/cuda/q_gemm_kernel_gptq.cuh
gptqmodel_ext/exllamav2/cuda/q_matrix.cu
gptqmodel_ext/exllamav2/cuda/q_matrix.cuh
gptqmodel_ext/exllamav2/cuda/util.cuh
gptqmodel_ext/exllamav2/cuda/quant/qdq_2.cuh
gptqmodel_ext/exllamav2/cuda/quant/qdq_3.cuh
gptqmodel_ext/exllamav2/cuda/quant/qdq_4.cuh
gptqmodel_ext/exllamav2/cuda/quant/qdq_5.cuh
gptqmodel_ext/exllamav2/cuda/quant/qdq_6.cuh
gptqmodel_ext/exllamav2/cuda/quant/qdq_8.cuh
gptqmodel_ext/exllamav2/cuda/quant/qdq_util.cuh
gptqmodel_ext/marlin/marlin.cuh
gptqmodel_ext/marlin/marlin_cuda.cpp
gptqmodel_ext/marlin/marlin_cuda_kernel.cu
gptqmodel_ext/marlin/marlin_cuda_kernel.cuh
gptqmodel_ext/marlin/marlin_dtypes.cuh
gptqmodel_ext/marlin/marlin_repack.cu
gptqmodel_ext/marlin/marlin_repack.cuh
gptqmodel_ext/qqq/qqq.cpp
gptqmodel_ext/qqq/qqq_gemm.cu
gptqmodel_ext/qqq/qqq_gemm.h