MANIFEST.in
README.md
pyproject.toml
setup.py
src/isagellm_core.egg-info/PKG-INFO
src/isagellm_core.egg-info/SOURCES.txt
src/isagellm_core.egg-info/dependency_links.txt
src/isagellm_core.egg-info/entry_points.txt
src/isagellm_core.egg-info/requires.txt
src/isagellm_core.egg-info/top_level.txt
src/sagellm_core/__init__.py
src/sagellm_core/__init__.pyc
src/sagellm_core/__main__.pyc
src/sagellm_core/_version.py
src/sagellm_core/_version.pyc
src/sagellm_core/config.pyc
src/sagellm_core/demo.pyc
src/sagellm_core/embedding_server.pyc
src/sagellm_core/engine.pyc
src/sagellm_core/engine_factory.pyc
src/sagellm_core/engine_server.pyc
src/sagellm_core/factory.pyc
src/sagellm_core/health.pyc
src/sagellm_core/llm_engine.pyc
src/sagellm_core/pd_executor.pyc
src/sagellm_core/plugins.pyc
src/sagellm_core/py.typed
src/sagellm_core/runner.pyc
src/sagellm_core/runtime.pyc
src/sagellm_core/runtime_optimizer.pyc
src/sagellm_core/workload.pyc
src/sagellm_core/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/__pycache__/__main__.cpython-311.pyc
src/sagellm_core/__pycache__/config.cpython-310.pyc
src/sagellm_core/__pycache__/config.cpython-311.pyc
src/sagellm_core/__pycache__/demo.cpython-310.pyc
src/sagellm_core/__pycache__/demo.cpython-311.pyc
src/sagellm_core/__pycache__/embedding_server.cpython-311.pyc
src/sagellm_core/__pycache__/engine.cpython-310.pyc
src/sagellm_core/__pycache__/engine.cpython-311.pyc
src/sagellm_core/__pycache__/engine_factory.cpython-310.pyc
src/sagellm_core/__pycache__/engine_factory.cpython-311.pyc
src/sagellm_core/__pycache__/engine_server.cpython-310.pyc
src/sagellm_core/__pycache__/engine_server.cpython-311.pyc
src/sagellm_core/__pycache__/health.cpython-310.pyc
src/sagellm_core/__pycache__/health.cpython-311.pyc
src/sagellm_core/__pycache__/llm_engine.cpython-311.pyc
src/sagellm_core/__pycache__/pd_executor.cpython-310.pyc
src/sagellm_core/__pycache__/pd_executor.cpython-311.pyc
src/sagellm_core/__pycache__/plugins.cpython-310.pyc
src/sagellm_core/__pycache__/plugins.cpython-311.pyc
src/sagellm_core/__pycache__/runner.cpython-310.pyc
src/sagellm_core/__pycache__/runner.cpython-311.pyc
src/sagellm_core/__pycache__/runtime.cpython-310.pyc
src/sagellm_core/__pycache__/runtime.cpython-311.pyc
src/sagellm_core/__pycache__/runtime_optimizer.cpython-310.pyc
src/sagellm_core/__pycache__/runtime_optimizer.cpython-311.pyc
src/sagellm_core/__pycache__/workload.cpython-310.pyc
src/sagellm_core/__pycache__/workload.cpython-311.pyc
src/sagellm_core/adapters/__init__.py
src/sagellm_core/adapters/__init__.pyc
src/sagellm_core/adapters/discovery.pyc
src/sagellm_core/adapters/lmdeploy_adapter.pyc
src/sagellm_core/adapters/native_adapter.pyc
src/sagellm_core/adapters/sglang_adapter.pyc
src/sagellm_core/adapters/vllm_adapter.pyc
src/sagellm_core/adapters/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/adapters/__pycache__/discovery.cpython-310.pyc
src/sagellm_core/adapters/__pycache__/lmdeploy_adapter.cpython-310.pyc
src/sagellm_core/adapters/__pycache__/native_adapter.cpython-310.pyc
src/sagellm_core/adapters/__pycache__/sglang_adapter.cpython-310.pyc
src/sagellm_core/adapters/__pycache__/vllm_adapter.cpython-310.pyc
src/sagellm_core/attention/__init__.py
src/sagellm_core/attention/__init__.pyc
src/sagellm_core/attention/layer_registry.pyc
src/sagellm_core/attention/sage_attention.pyc
src/sagellm_core/attention/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/attention/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/attention/__pycache__/layer_registry.cpython-310.pyc
src/sagellm_core/attention/__pycache__/layer_registry.cpython-311.pyc
src/sagellm_core/attention/__pycache__/sage_attention.cpython-310.pyc
src/sagellm_core/attention/__pycache__/sage_attention.cpython-311.pyc
src/sagellm_core/decoding/__init__.py
src/sagellm_core/decoding/__init__.pyc
src/sagellm_core/decoding/base.pyc
src/sagellm_core/decoding/beam_search.pyc
src/sagellm_core/decoding/contrastive.pyc
src/sagellm_core/decoding/greedy.pyc
src/sagellm_core/decoding/sampling.pyc
src/sagellm_core/decoding/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/decoding/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/decoding/__pycache__/base.cpython-310.pyc
src/sagellm_core/decoding/__pycache__/base.cpython-311.pyc
src/sagellm_core/decoding/__pycache__/beam_search.cpython-310.pyc
src/sagellm_core/decoding/__pycache__/beam_search.cpython-311.pyc
src/sagellm_core/decoding/__pycache__/contrastive.cpython-310.pyc
src/sagellm_core/decoding/__pycache__/contrastive.cpython-311.pyc
src/sagellm_core/decoding/__pycache__/greedy.cpython-310.pyc
src/sagellm_core/decoding/__pycache__/greedy.cpython-311.pyc
src/sagellm_core/decoding/__pycache__/sampling.cpython-310.pyc
src/sagellm_core/decoding/__pycache__/sampling.cpython-311.pyc
src/sagellm_core/distributed/__init__.py
src/sagellm_core/distributed/__init__.pyc
src/sagellm_core/distributed/strategies.pyc
src/sagellm_core/distributed/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/distributed/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/distributed/__pycache__/strategies.cpython-310.pyc
src/sagellm_core/distributed/__pycache__/strategies.cpython-311.pyc
src/sagellm_core/engine_core/__init__.py
src/sagellm_core/engine_core/__init__.pyc
src/sagellm_core/engine_core/engine_core.pyc
src/sagellm_core/engine_core/kv_cache_manager.pyc
src/sagellm_core/engine_core/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/engine_core/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/engine_core/__pycache__/engine_core.cpython-310.pyc
src/sagellm_core/engine_core/__pycache__/engine_core.cpython-311.pyc
src/sagellm_core/engine_core/__pycache__/kv_cache_manager.cpython-310.pyc
src/sagellm_core/engine_core/__pycache__/kv_cache_manager.cpython-311.pyc
src/sagellm_core/engine_core/scheduler/__init__.py
src/sagellm_core/engine_core/scheduler/__init__.pyc
src/sagellm_core/engine_core/scheduler/base.pyc
src/sagellm_core/engine_core/scheduler/batch.pyc
src/sagellm_core/engine_core/scheduler/metrics.pyc
src/sagellm_core/engine_core/scheduler/scheduler.pyc
src/sagellm_core/engine_core/scheduler/scheduler_kv_bridge.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/base.cpython-310.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/base.cpython-311.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/batch.cpython-310.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/batch.cpython-311.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/metrics.cpython-310.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/metrics.cpython-311.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/scheduler.cpython-310.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/scheduler.cpython-311.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/scheduler_kv_bridge.cpython-310.pyc
src/sagellm_core/engine_core/scheduler/__pycache__/scheduler_kv_bridge.cpython-311.pyc
src/sagellm_core/engine_core/scheduler/policy/__init__.py
src/sagellm_core/engine_core/scheduler/policy/__init__.pyc
src/sagellm_core/engine_core/scheduler/policy/fcfs.pyc
src/sagellm_core/engine_core/scheduler/policy/priority.pyc
src/sagellm_core/engine_core/scheduler/policy/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/engine_core/scheduler/policy/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/engine_core/scheduler/policy/__pycache__/fcfs.cpython-310.pyc
src/sagellm_core/engine_core/scheduler/policy/__pycache__/fcfs.cpython-311.pyc
src/sagellm_core/engine_core/scheduler/policy/__pycache__/priority.cpython-310.pyc
src/sagellm_core/engine_core/scheduler/policy/__pycache__/priority.cpython-311.pyc
src/sagellm_core/engines/__init__.py
src/sagellm_core/engines/__init__.pyc
src/sagellm_core/engines/cpu_embedding.pyc
src/sagellm_core/engines/embedding.pyc
src/sagellm_core/engines/registry.pyc
src/sagellm_core/engines/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/engines/__pycache__/cpu_embedding.cpython-311.pyc
src/sagellm_core/engines/__pycache__/embedding.cpython-311.pyc
src/sagellm_core/engines/__pycache__/registry.cpython-311.pyc
src/sagellm_core/executor/__init__.py
src/sagellm_core/executor/__init__.pyc
src/sagellm_core/executor/executor_base.pyc
src/sagellm_core/executor/uniproc_executor.pyc
src/sagellm_core/executor/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/executor/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/executor/__pycache__/executor_base.cpython-310.pyc
src/sagellm_core/executor/__pycache__/executor_base.cpython-311.pyc
src/sagellm_core/executor/__pycache__/uniproc_executor.cpython-310.pyc
src/sagellm_core/executor/__pycache__/uniproc_executor.cpython-311.pyc
src/sagellm_core/inputs/__init__.py
src/sagellm_core/inputs/__init__.pyc
src/sagellm_core/inputs/processor.pyc
src/sagellm_core/inputs/tokenizer_utils.pyc
src/sagellm_core/inputs/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/inputs/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/inputs/__pycache__/processor.cpython-310.pyc
src/sagellm_core/inputs/__pycache__/processor.cpython-311.pyc
src/sagellm_core/inputs/__pycache__/tokenizer_utils.cpython-310.pyc
src/sagellm_core/inputs/__pycache__/tokenizer_utils.cpython-311.pyc
src/sagellm_core/kernel/__init__.py
src/sagellm_core/kernel/__init__.pyc
src/sagellm_core/kernel/fusion_detector.pyc
src/sagellm_core/kernel/kernel_injector.pyc
src/sagellm_core/kernel/kernel_loader.pyc
src/sagellm_core/kernel/kernel_registry.pyc
src/sagellm_core/kernel/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/kernel/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/kernel/__pycache__/fusion_detector.cpython-310.pyc
src/sagellm_core/kernel/__pycache__/fusion_detector.cpython-311.pyc
src/sagellm_core/kernel/__pycache__/kernel_injector.cpython-310.pyc
src/sagellm_core/kernel/__pycache__/kernel_injector.cpython-311.pyc
src/sagellm_core/kernel/__pycache__/kernel_loader.cpython-310.pyc
src/sagellm_core/kernel/__pycache__/kernel_loader.cpython-311.pyc
src/sagellm_core/kernel/__pycache__/kernel_registry.cpython-310.pyc
src/sagellm_core/kernel/__pycache__/kernel_registry.cpython-311.pyc
src/sagellm_core/kernel_injection/__init__.py
src/sagellm_core/kernel_injection/__init__.pyc
src/sagellm_core/kernel_injection/backend_bridge.pyc
src/sagellm_core/kernel_injection/fused_kernels.pyc
src/sagellm_core/kernel_injection/integration.pyc
src/sagellm_core/kernel_injection/kernel_injector.pyc
src/sagellm_core/kernel_injection/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/kernel_injection/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/kernel_injection/__pycache__/backend_bridge.cpython-310.pyc
src/sagellm_core/kernel_injection/__pycache__/backend_bridge.cpython-311.pyc
src/sagellm_core/kernel_injection/__pycache__/fused_kernels.cpython-310.pyc
src/sagellm_core/kernel_injection/__pycache__/fused_kernels.cpython-311.pyc
src/sagellm_core/kernel_injection/__pycache__/integration.cpython-310.pyc
src/sagellm_core/kernel_injection/__pycache__/integration.cpython-311.pyc
src/sagellm_core/kernel_injection/__pycache__/kernel_injector.cpython-310.pyc
src/sagellm_core/kernel_injection/__pycache__/kernel_injector.cpython-311.pyc
src/sagellm_core/model/__init__.py
src/sagellm_core/model/__init__.pyc
src/sagellm_core/model/hf_loader.pyc
src/sagellm_core/model/layerwise_loader.pyc
src/sagellm_core/model/load_config.pyc
src/sagellm_core/model/loader.pyc
src/sagellm_core/model/model_loader.pyc
src/sagellm_core/model/quantization.pyc
src/sagellm_core/model/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/model/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/model/__pycache__/hf_loader.cpython-310.pyc
src/sagellm_core/model/__pycache__/hf_loader.cpython-311.pyc
src/sagellm_core/model/__pycache__/layerwise_loader.cpython-310.pyc
src/sagellm_core/model/__pycache__/layerwise_loader.cpython-311.pyc
src/sagellm_core/model/__pycache__/load_config.cpython-310.pyc
src/sagellm_core/model/__pycache__/load_config.cpython-311.pyc
src/sagellm_core/model/__pycache__/loader.cpython-310.pyc
src/sagellm_core/model/__pycache__/loader.cpython-311.pyc
src/sagellm_core/model/__pycache__/model_loader.cpython-310.pyc
src/sagellm_core/model/__pycache__/model_loader.cpython-311.pyc
src/sagellm_core/model/__pycache__/quantization.cpython-310.pyc
src/sagellm_core/model/__pycache__/quantization.cpython-311.pyc
src/sagellm_core/model/architectures/__init__.py
src/sagellm_core/model/architectures/__init__.pyc
src/sagellm_core/model/architectures/base.pyc
src/sagellm_core/model/architectures/llama.pyc
src/sagellm_core/model/architectures/qwen.pyc
src/sagellm_core/model/architectures/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/model/architectures/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/model/architectures/__pycache__/base.cpython-310.pyc
src/sagellm_core/model/architectures/__pycache__/base.cpython-311.pyc
src/sagellm_core/model/architectures/__pycache__/llama.cpython-310.pyc
src/sagellm_core/model/architectures/__pycache__/llama.cpython-311.pyc
src/sagellm_core/model/architectures/__pycache__/qwen.cpython-310.pyc
src/sagellm_core/model/architectures/__pycache__/qwen.cpython-311.pyc
src/sagellm_core/model/layers/__init__.py
src/sagellm_core/model/layers/__init__.pyc
src/sagellm_core/model/layers/fused_layers.pyc
src/sagellm_core/model/layers/layer_replacement.pyc
src/sagellm_core/model/layers/linear.pyc
src/sagellm_core/model/layers/normalization.pyc
src/sagellm_core/model/layers/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/model/layers/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/model/layers/__pycache__/fused_layers.cpython-310.pyc
src/sagellm_core/model/layers/__pycache__/fused_layers.cpython-311.pyc
src/sagellm_core/model/layers/__pycache__/layer_replacement.cpython-310.pyc
src/sagellm_core/model/layers/__pycache__/layer_replacement.cpython-311.pyc
src/sagellm_core/model/layers/__pycache__/linear.cpython-310.pyc
src/sagellm_core/model/layers/__pycache__/linear.cpython-311.pyc
src/sagellm_core/model/layers/__pycache__/normalization.cpython-310.pyc
src/sagellm_core/model/layers/__pycache__/normalization.cpython-311.pyc
src/sagellm_core/observability/__init__.py
src/sagellm_core/observability/__init__.pyc
src/sagellm_core/observability/logger.pyc
src/sagellm_core/observability/metrics.pyc
src/sagellm_core/observability/prometheus.pyc
src/sagellm_core/observability/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/observability/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/observability/__pycache__/logger.cpython-310.pyc
src/sagellm_core/observability/__pycache__/logger.cpython-311.pyc
src/sagellm_core/observability/__pycache__/metrics.cpython-310.pyc
src/sagellm_core/observability/__pycache__/metrics.cpython-311.pyc
src/sagellm_core/observability/__pycache__/prometheus.cpython-310.pyc
src/sagellm_core/observability/__pycache__/prometheus.cpython-311.pyc
src/sagellm_core/sampling/__init__.py
src/sagellm_core/sampling/__init__.pyc
src/sagellm_core/sampling/params.pyc
src/sagellm_core/sampling/sampler.pyc
src/sagellm_core/sampling/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/sampling/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/sampling/__pycache__/params.cpython-310.pyc
src/sagellm_core/sampling/__pycache__/params.cpython-311.pyc
src/sagellm_core/sampling/__pycache__/sampler.cpython-310.pyc
src/sagellm_core/sampling/__pycache__/sampler.cpython-311.pyc
src/sagellm_core/worker/__init__.py
src/sagellm_core/worker/__init__.pyc
src/sagellm_core/worker/worker.pyc
src/sagellm_core/worker/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/worker/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/worker/__pycache__/worker.cpython-310.pyc
src/sagellm_core/worker/__pycache__/worker.cpython-311.pyc
src/sagellm_core/worker/model_runner/__init__.py
src/sagellm_core/worker/model_runner/__init__.pyc
src/sagellm_core/worker/model_runner/kernel_layers.pyc
src/sagellm_core/worker/model_runner/model_runner.pyc
src/sagellm_core/worker/model_runner/__pycache__/__init__.cpython-310.pyc
src/sagellm_core/worker/model_runner/__pycache__/__init__.cpython-311.pyc
src/sagellm_core/worker/model_runner/__pycache__/kernel_layers.cpython-310.pyc
src/sagellm_core/worker/model_runner/__pycache__/kernel_layers.cpython-311.pyc
src/sagellm_core/worker/model_runner/__pycache__/model_runner.cpython-310.pyc
src/sagellm_core/worker/model_runner/__pycache__/model_runner.cpython-311.pyc
tests/test_adaptive_precision_strategy.py
tests/test_attention.py
tests/test_backend_kernel_usage.py
tests/test_ci_smoke.py
tests/test_compute_comm_overlap_strategy.py
tests/test_config.py
tests/test_cpu_embedding_engine.py
tests/test_cuda_graph_capture_strategy.py
tests/test_decoding_strategies.py
tests/test_dynamic_batching_strategy.py
tests/test_e2e_llm_integration.py
tests/test_embedding_server.py
tests/test_engine.py
tests/test_engine_behavior_parity.py
tests/test_engine_contract_simplified.py
tests/test_engine_server.py
tests/test_fused_kernels.py
tests/test_kernel_injection.py
tests/test_kv_cache_integration_e2e.py
tests/test_kv_compute_coopt_strategy.py
tests/test_layer_replacement.py
tests/test_llm_engine_backend_runtime.py
tests/test_llm_engine_contract.py
tests/test_llm_engine_decoding.py
tests/test_llm_engine_error_handling.py
tests/test_llm_engine_task2_interfaces.py
tests/test_model_loader.py
tests/test_model_runner_attention_integration.py
tests/test_observability.py
tests/test_operator_mapping_integration.py
tests/test_pd_separation.py
tests/test_prefix_cache_integration.py
tests/test_runtime_optimizer.py
tests/test_sampling.py
tests/test_scheduler_kv_integration.py
tests/test_streaming_pd.py
tests/test_task0_10_workload.py
tests/test_task3_loader_orchestration.py