MANIFEST.in
README.md
setup.py
csrc/dp_core.cpp
galvatron/__init__.py
galvatron/core/__init__.py
galvatron/core/arguments.py
galvatron/core/comm_groups.py
galvatron/core/cost_model.py
galvatron/core/dataloader.py
galvatron/core/dynamic_programming.py
galvatron/core/hybrid_parallel_config.py
galvatron/core/hybrid_parallel_model.py
galvatron/core/initialize.py
galvatron/core/parallel.py
galvatron/core/profiler.py
galvatron/core/redistribute.py
galvatron/core/search_engine.py
galvatron/core/pipeline/__init__.py
galvatron/core/pipeline/grad_reduce.py
galvatron/core/pipeline/pipeline.py
galvatron/core/pipeline/utils.py
galvatron/core/tensor_parallel/__init__.py
galvatron/core/tensor_parallel/transformer.py
galvatron/core/tensor_parallel/utils.py
galvatron/models/__init__.py
galvatron/models/baichuan/BaiChuanModel_hybrid_parallel.py
galvatron/models/baichuan/BaiChuanModel_sequential.py
galvatron/models/baichuan/BaiChuanModel_tensor_parallel.py
galvatron/models/baichuan/__init__.py
galvatron/models/baichuan/arguments.py
galvatron/models/baichuan/dataloader.py
galvatron/models/baichuan/profile.py
galvatron/models/baichuan/search_dist.py
galvatron/models/baichuan/train.py
galvatron/models/baichuan/train_dist.py
galvatron/models/baichuan/configs/computation_profiling_bf16_hidden4096_head32_seqlen2048.json
galvatron/models/baichuan/configs/galvatron_config_baichuan-7b_2nodes_8gpus_per_node_40GB_bf16_3D_example.json
galvatron/models/baichuan/configs/galvatron_config_baichuan-7b_2nodes_8gpus_per_node_40GB_bf16_example.json
galvatron/models/baichuan/configs/memory_profiling_bf16_hidden4096_head32_seqlen2048.json
galvatron/models/baichuan/hf_configs/__init__.py
galvatron/models/baichuan/hf_configs/config_utils.py
galvatron/models/baichuan/hf_configs/baichuan-7b/config.json
galvatron/models/baichuan/hf_configs/baichuan-7b/config_ori.json
galvatron/models/bert/BertModel_hybrid_parallel.py
galvatron/models/bert/BertModel_sequential.py
galvatron/models/bert/BertModel_tensor_parallel.py
galvatron/models/bert/__init__.py
galvatron/models/bert/arguments.py
galvatron/models/bert/dataloader.py
galvatron/models/bert/profile.py
galvatron/models/bert/search_dist.py
galvatron/models/bert/train.py
galvatron/models/bert/train_dist.py
galvatron/models/bert/configs/computation_profiling_bf16_hidden1024_head16_seqlen512.json
galvatron/models/bert/configs/computation_profiling_bf16_hidden1280_head16_seqlen512.json
galvatron/models/bert/configs/galvatron_config_16gpus_1024hidden_24layers_example.json
galvatron/models/bert/configs/galvatron_config_16gpus_1280hidden_32layers_example.json
galvatron/models/bert/configs/galvatron_config_4gpus_1024hidden_24layers_example.json
galvatron/models/bert/configs/galvatron_config_4gpus_1280hidden_32layers_example.json
galvatron/models/bert/configs/galvatron_config_8gpus_1024hidden_24layers_example.json
galvatron/models/bert/configs/galvatron_config_8gpus_1280hidden_32layers_12G_full.json
galvatron/models/bert/configs/galvatron_config_8gpus_1280hidden_32layers_8G_full.json
galvatron/models/bert/configs/galvatron_config_8gpus_1280hidden_32layers_example.json
galvatron/models/bert/configs/memory_profiling_bf16_hidden1024_head16_seqlen512.json
galvatron/models/bert/configs/memory_profiling_bf16_hidden1280_head16_seqlen512.json
galvatron/models/bert/configs/memory_profiling_fp32_hidden1024_head16_seqlen512.json
galvatron/models/bert/configs/memory_profiling_fp32_hidden1280_head16_seqlen512.json
galvatron/models/bert/hf_configs/__init__.py
galvatron/models/bert/hf_configs/bert-base-uncased.json
galvatron/models/bert/hf_configs/bert-huge-uncased-32.json
galvatron/models/bert/hf_configs/bert-huge-uncased-48.json
galvatron/models/bert/hf_configs/bert-large-uncased.json
galvatron/models/bert/hf_configs/config_utils.py
galvatron/models/chatglm2/ChatGLMModel_hybrid_parallel.py
galvatron/models/chatglm2/ChatGLMModel_sequential.py
galvatron/models/chatglm2/ChatGLMModel_tensor_parallel.py
galvatron/models/chatglm2/__init__.py
galvatron/models/chatglm2/arguments.py
galvatron/models/chatglm2/dataloader.py
galvatron/models/chatglm2/profile.py
galvatron/models/chatglm2/search_dist.py
galvatron/models/chatglm2/train.py
galvatron/models/chatglm2/train_dist.py
galvatron/models/chatglm2/configs/computation_profiling_bf16_hidden4096_head32_seqlen2048.json
galvatron/models/chatglm2/configs/galvatron_config_hidden4096_head32_seqlen2048_2nodes_8gpus_per_node_24GB_bf16_zero2_[tp_off].json
galvatron/models/chatglm2/configs/galvatron_config_hidden4096_head32_seqlen2048_2nodes_8gpus_per_node_28GB_bf16_zero2_[tp_off].json
galvatron/models/chatglm2/configs/galvatron_config_hidden4096_head32_seqlen2048_2nodes_8gpus_per_node_30GB_bf16_zero2_[tp_off].json
galvatron/models/chatglm2/configs/galvatron_config_hidden4096_head32_seqlen2048_2nodes_8gpus_per_node_33GB_bf16_zero2_[tp_off].json
galvatron/models/chatglm2/configs/galvatron_config_hidden4096_head32_seqlen2048_2nodes_8gpus_per_node_40GB_bf16_zero2_[tp_off].json
galvatron/models/chatglm2/configs/memory_profiling_bf16_hidden4096_head32_seqlen2048.json
galvatron/models/chatglm2/hf_configs/__init__.py
galvatron/models/chatglm2/hf_configs/config_utils.py
galvatron/models/chatglm2/hf_configs/chatglm2-6b/config copy.json
galvatron/models/chatglm2/hf_configs/chatglm2-6b/config.json
galvatron/models/chatglm2/hf_configs/chatglm2-6b/tokenizer_config.json
galvatron/models/clip/CLIPModel_hybrid_parallel.py
galvatron/models/clip/CLIPModel_sequential.py
galvatron/models/clip/CLIPModel_tensor_parallel.py
galvatron/models/clip/__init__.py
galvatron/models/clip/arguments.py
galvatron/models/clip/dataloader.py
galvatron/models/clip/profile.py
galvatron/models/clip/search_dist.py
galvatron/models/clip/train.py
galvatron/models/clip/train_dist.py
galvatron/models/clip/configs/computation_profiling_bf16_CLIP-vit-H-14.json
galvatron/models/clip/configs/computation_profiling_bf16_CLIP-vit-L-14.json
galvatron/models/clip/configs/computation_profiling_bf16_CLIP-vit-g-14.json
galvatron/models/clip/configs/galvatron_config_8gpus_vit-H-14_24G_example.json
galvatron/models/clip/configs/memory_profiling_bf16_CLIP-vit-H-14.json
galvatron/models/clip/configs/memory_profiling_bf16_CLIP-vit-L-14.json
galvatron/models/clip/configs/memory_profiling_bf16_CLIP-vit-bigG-14.json
galvatron/models/clip/configs/memory_profiling_bf16_CLIP-vit-g-14.json
galvatron/models/clip/hf_configs/CLIP-ViT-B-16.json
galvatron/models/clip/hf_configs/CLIP-ViT-H-14-laion2B-s32B-b79K.json
galvatron/models/clip/hf_configs/CLIP-ViT-L-14-laion2B-s32B-b82K.json
galvatron/models/clip/hf_configs/CLIP-ViT-bigG-14-laion2B-39B-b160k.json
galvatron/models/clip/hf_configs/CLIP-ViT-g-14-laion2B-s12B-b42K.json
galvatron/models/clip/hf_configs/__init__.py
galvatron/models/clip/hf_configs/config_utils.py
galvatron/models/gpt/GPTModel_hybrid_parallel.py
galvatron/models/gpt/GPTModel_sequential.py
galvatron/models/gpt/GPTModel_tensor_parallel.py
galvatron/models/gpt/__init__.py
galvatron/models/gpt/arguments.py
galvatron/models/gpt/dataloader.py
galvatron/models/gpt/profile.py
galvatron/models/gpt/search_dist.py
galvatron/models/gpt/train.py
galvatron/models/gpt/train_dist.py
galvatron/models/gpt/configs/computation_profiling_bf16_hidden1600_head32_seqlen1024.json
galvatron/models/gpt/configs/computation_profiling_bf16_hidden2560_head32_seqlen2048.json
galvatron/models/gpt/configs/computation_profiling_bf16_hidden4096_head32_seqlen2048.json
galvatron/models/gpt/configs/galvatron_config_gpt-1.5b_2nodes_8gpus_per_node_40GB_bf16_3D_example.json
galvatron/models/gpt/configs/galvatron_config_gpt-1.5b_2nodes_8gpus_per_node_40GB_bf16_example.json
galvatron/models/gpt/configs/galvatron_config_gpt-2.7b_2nodes_8gpus_per_node_40GB_bf16_3D_example.json
galvatron/models/gpt/configs/galvatron_config_gpt-2.7b_2nodes_8gpus_per_node_40GB_bf16_example.json
galvatron/models/gpt/configs/galvatron_config_gpt-6.7b_2nodes_8gpus_per_node_40GB_bf16_3D_example.json
galvatron/models/gpt/configs/galvatron_config_gpt-6.7b_2nodes_8gpus_per_node_40GB_bf16_example.json
galvatron/models/gpt/configs/memory_profiling_bf16_hidden1600_head32_seqlen1024.json
galvatron/models/gpt/configs/memory_profiling_bf16_hidden2560_head32_seqlen2048.json
galvatron/models/gpt/configs/memory_profiling_bf16_hidden4096_head32_seqlen2048.json
galvatron/models/gpt/meta_configs/__init__.py
galvatron/models/gpt/meta_configs/config_utils.py
galvatron/models/gpt/meta_configs/gpt-0.3b.json
galvatron/models/gpt/meta_configs/gpt-1.5b.json
galvatron/models/gpt/meta_configs/gpt-2.7b.json
galvatron/models/gpt/meta_configs/gpt-6.7b.json
galvatron/models/llama/LlamaModel_hybrid_parallel.py
galvatron/models/llama/LlamaModel_sequential.py
galvatron/models/llama/LlamaModel_tensor_parallel.py
galvatron/models/llama/__init__.py
galvatron/models/llama/arguments.py
galvatron/models/llama/dataloader.py
galvatron/models/llama/profile.py
galvatron/models/llama/search_dist.py
galvatron/models/llama/train.py
galvatron/models/llama/train_dist.py
galvatron/models/llama/configs/computation_profiling_bf16_hidden4096_head32_seqlen2048.json
galvatron/models/llama/configs/galvatron_config_llama-7b_2nodes_8gpus_per_node_40GB_bf16_3D_example.json
galvatron/models/llama/configs/galvatron_config_llama-7b_2nodes_8gpus_per_node_40GB_bf16_example.json
galvatron/models/llama/configs/memory_profiling_bf16_hidden4096_head32_seqlen2048.json
galvatron/models/llama/meta_configs/__init__.py
galvatron/models/llama/meta_configs/config_utils.py
galvatron/models/llama/meta_configs/llama-13b.json
galvatron/models/llama/meta_configs/llama-30b.json
galvatron/models/llama/meta_configs/llama-7b.json
galvatron/models/swin/SwinModel_hybrid_parallel.py
galvatron/models/swin/SwinModel_sequential.py
galvatron/models/swin/SwinModel_tensor_parallel.py
galvatron/models/swin/__init__.py
galvatron/models/swin/arguments.py
galvatron/models/swin/dataloader.py
galvatron/models/swin/profile.py
galvatron/models/swin/search_dist.py
galvatron/models/swin/train.py
galvatron/models/swin/train_dist.py
galvatron/models/swin/configs/backup.json
galvatron/models/swin/configs/computation_profiling_bf16_embed320_head[8,16,32,64]_patch4_window7_img224.json
galvatron/models/swin/configs/memory_profiling_bf16_embed320_head[8,16,32,64]_patch4_window7_img224.json
galvatron/models/swin/configs/memory_profiling_fp32_embed320_head[8,16,32,64]_patch4_window7_img224.json
galvatron/models/swin/hf_configs/__init__.py
galvatron/models/swin/hf_configs/config_utils.py
galvatron/models/swin/hf_configs/swin-huge-layer32-patch4-window7-224.json
galvatron/models/swin/hf_configs/swin-huge-layer48-patch4-window7-224.json
galvatron/models/t5/T5Model_hybrid_parallel.py
galvatron/models/t5/T5Model_sequential.py
galvatron/models/t5/T5Model_tensor_parallel.py
galvatron/models/t5/__init__.py
galvatron/models/t5/arguments.py
galvatron/models/t5/dataloader.py
galvatron/models/t5/profile.py
galvatron/models/t5/train.py
galvatron/models/t5/train_dist.py
galvatron/models/t5/hf_configs/__init__.py
galvatron/models/t5/hf_configs/config_utils.py
galvatron/models/t5/hf_configs/t5-base.json
galvatron/models/t5/hf_configs/t5-large.json
galvatron/models/vit/ViTModel_hybrid_parallel.py
galvatron/models/vit/ViTModel_sequential.py
galvatron/models/vit/ViTModel_tensor_parallel.py
galvatron/models/vit/__init__.py
galvatron/models/vit/arguments.py
galvatron/models/vit/dataloader.py
galvatron/models/vit/profile.py
galvatron/models/vit/search_dist.py
galvatron/models/vit/train.py
galvatron/models/vit/train_dist.py
galvatron/models/vit/configs/computation_profiling_bf16_hidden1024_head16_patch16_img224.json
galvatron/models/vit/configs/computation_profiling_bf16_hidden1280_head16_patch14_img224.json
galvatron/models/vit/configs/galvatron_config_hidden1024_head16_patch16_img224_1nodes_8gpus_per_node_40GB_bf16.json
galvatron/models/vit/configs/memory_profiling_bf16_hidden1024_head16_patch16_img224.json
galvatron/models/vit/configs/memory_profiling_bf16_hidden1280_head16_patch14_img224.json
galvatron/models/vit/configs/memory_profiling_fp32_hidden1024_head16_patch16_img224.json
galvatron/models/vit/configs/memory_profiling_fp32_hidden1280_head16_patch14_img224.json
galvatron/models/vit/hf_configs/__init__.py
galvatron/models/vit/hf_configs/config_utils.py
galvatron/models/vit/hf_configs/vit-huge-patch14-224-layer48.json
galvatron/models/vit/hf_configs/vit-huge-patch14-224.json
galvatron/models/vit/hf_configs/vit-large-patch16-224.json
galvatron/models_baseline/__init__.py
galvatron/models_baseline/utils.py
galvatron/models_baseline/baichuan/ds_config.json
galvatron/models_baseline/baichuan/baichuan-config/baichuan-7b/config.json
galvatron/models_baseline/baichuan/baichuan-config/baichuan-7b/config_ori.json
galvatron/models_baseline/bert/ds_config.json
galvatron/models_baseline/bert/bert_hf_configs/bert-base-uncased.json
galvatron/models_baseline/bert/bert_hf_configs/bert-huge-uncased-32.json
galvatron/models_baseline/bert/bert_hf_configs/bert-huge-uncased-48.json
galvatron/models_baseline/bert/bert_hf_configs/bert-large-uncased.json
galvatron/models_baseline/chatglm2/ds_config.json
galvatron/models_baseline/chatglm2/models/chatglm2-6b/config.json
galvatron/models_baseline/chatglm2/models/chatglm2-6b/tokenizer_config.json
galvatron/models_baseline/clip/ds_config.json
galvatron/models_baseline/clip/clip_hf_configs/CLIP-ViT-B-16.json
galvatron/models_baseline/clip/clip_hf_configs/CLIP-ViT-H-14-laion2B-s32B-b79K.json
galvatron/models_baseline/clip/clip_hf_configs/CLIP-ViT-L-14-laion2B-s32B-b82K.json
galvatron/models_baseline/clip/clip_hf_configs/CLIP-ViT-bigG-14-laion2B-39B-b160k.json
galvatron/models_baseline/clip/clip_hf_configs/CLIP-ViT-g-14-laion2B-s12B-b42K.json
galvatron/models_baseline/gpt/ds_config.json
galvatron/models_baseline/gpt/gpt-config/gpt-0.3b.json
galvatron/models_baseline/gpt/gpt-config/gpt-1.5b.json
galvatron/models_baseline/gpt/gpt-config/gpt-2.7b.json
galvatron/models_baseline/gpt/gpt-config/gpt-6.7b.json
galvatron/models_baseline/llama/ds_config.json
galvatron/models_baseline/llama/llama-config/llama-13b/params.json
galvatron/models_baseline/llama/llama-config/llama-13b/llama-13b/config.json
galvatron/models_baseline/llama/llama-config/llama-30b/params.json
galvatron/models_baseline/llama/llama-config/llama-30b/llama-30b/config.json
galvatron/models_baseline/llama/llama-config/llama-7b/params.json
galvatron/models_baseline/llama/llama-config/llama-7b/llama-7b/config.json
galvatron/models_baseline/swin/ds_config.json
galvatron/models_baseline/swin/swin_hf_configs/swin-huge-layer32-patch4-window7-224.json
galvatron/models_baseline/swin/swin_hf_configs/swin-huge-layer48-patch4-window7-224.json
galvatron/models_baseline/t5/ds_config.json
galvatron/models_baseline/t5/t5_hf_configs/t5-base.json
galvatron/models_baseline/t5/t5_hf_configs/t5-large.json
galvatron/models_baseline/vit/ds_config.json
galvatron/models_baseline/vit/hf_configs/vit-huge-patch14-224-layer48.json
galvatron/models_baseline/vit/hf_configs/vit-huge-patch14-224.json
galvatron/models_baseline/vit/hf_configs/vit-large-patch16-224.json
galvatron/profile_hardware/hardware_configs/allreduce_bandwidth_1nodes_4gpus_per_node.json
galvatron/profile_hardware/hardware_configs/allreduce_bandwidth_1nodes_8gpus_per_node.json
galvatron/profile_hardware/hardware_configs/allreduce_bandwidth_2nodes_8gpus_per_node.json
galvatron/profile_hardware/hardware_configs/overlap_coefficient.json
galvatron/profile_hardware/hardware_configs/p2p_bandwidth_1nodes_4gpus_per_node.json
galvatron/profile_hardware/hardware_configs/p2p_bandwidth_1nodes_8gpus_per_node.json
galvatron/profile_hardware/hardware_configs/p2p_bandwidth_2nodes_8gpus_per_node.json
galvatron/scripts/flash_attn_ops_install.sh
galvatron/site_package/__init__.py
galvatron/site_package/megatron/__init__.py
galvatron/site_package/megatron/arguments.py
galvatron/site_package/megatron/checkpointing.py
galvatron/site_package/megatron/dist_signal_handler.py
galvatron/site_package/megatron/global_vars.py
galvatron/site_package/megatron/indexer.py
galvatron/site_package/megatron/initialize.py
galvatron/site_package/megatron/memory.py
galvatron/site_package/megatron/microbatches.py
galvatron/site_package/megatron/optimizer_param_scheduler.py
galvatron/site_package/megatron/text_generation_server.py
galvatron/site_package/megatron/timers.py
galvatron/site_package/megatron/training.py
galvatron/site_package/megatron/utils.py
galvatron/site_package/megatron/core/__init__.py
galvatron/site_package/megatron/core/enums.py
galvatron/site_package/megatron/core/package_info.py
galvatron/site_package/megatron/core/parallel_state.py
galvatron/site_package/megatron/core/utils.py
galvatron/site_package/megatron/core/pipeline_parallel/__init__.py
galvatron/site_package/megatron/core/pipeline_parallel/p2p_communication.py
galvatron/site_package/megatron/core/pipeline_parallel/schedules.py
galvatron/site_package/megatron/core/tensor_parallel/__init__.py
galvatron/site_package/megatron/core/tensor_parallel/cross_entropy.py
galvatron/site_package/megatron/core/tensor_parallel/data.py
galvatron/site_package/megatron/core/tensor_parallel/layers.py
galvatron/site_package/megatron/core/tensor_parallel/mappings.py
galvatron/site_package/megatron/core/tensor_parallel/mappings_group.py
galvatron/site_package/megatron/core/tensor_parallel/random.py
galvatron/site_package/megatron/core/tensor_parallel/utils.py
galvatron/site_package/megatron/data/__init__.py
galvatron/site_package/megatron/data/autoaugment.py
galvatron/site_package/megatron/data/bert_dataset.py
galvatron/site_package/megatron/data/biencoder_dataset_utils.py
galvatron/site_package/megatron/data/blendable_dataset.py
galvatron/site_package/megatron/data/data_samplers.py
galvatron/site_package/megatron/data/dataset_utils.py
galvatron/site_package/megatron/data/gpt_dataset.py
galvatron/site_package/megatron/data/ict_dataset.py
galvatron/site_package/megatron/data/indexed_dataset.py
galvatron/site_package/megatron/data/orqa_wiki_dataset.py
galvatron/site_package/megatron/data/realm_dataset_utils.py
galvatron/site_package/megatron/data/realm_index.py
galvatron/site_package/megatron/data/t5_dataset.py
galvatron/site_package/megatron/data/vit_dataset.py
galvatron/site_package/megatron/fused_kernels/__init__.py
galvatron/site_package/megatron/fused_kernels/tests/__init__.py
galvatron/site_package/megatron/fused_kernels/tests/test_fused_kernels.py
galvatron/site_package/megatron/model/__init__.py
galvatron/site_package/megatron/model/bert_model.py
galvatron/site_package/megatron/model/biencoder_model.py
galvatron/site_package/megatron/model/classification.py
galvatron/site_package/megatron/model/distributed.py
galvatron/site_package/megatron/model/enums.py
galvatron/site_package/megatron/model/fused_bias_gelu.py
galvatron/site_package/megatron/model/fused_layer_norm.py
galvatron/site_package/megatron/model/fused_softmax.py
galvatron/site_package/megatron/model/gpt_model.py
galvatron/site_package/megatron/model/language_model.py
galvatron/site_package/megatron/model/module.py
galvatron/site_package/megatron/model/multiple_choice.py
galvatron/site_package/megatron/model/realm_model.py
galvatron/site_package/megatron/model/retro_transformer.py
galvatron/site_package/megatron/model/rotary_pos_embedding.py
galvatron/site_package/megatron/model/t5_model.py
galvatron/site_package/megatron/model/transformer.py
galvatron/site_package/megatron/model/utils.py
galvatron/site_package/megatron/optimizer/__init__.py
galvatron/site_package/megatron/optimizer/clip_grads.py
galvatron/site_package/megatron/optimizer/distrib_optimizer.py
galvatron/site_package/megatron/optimizer/grad_scaler.py
galvatron/site_package/megatron/optimizer/optimizer.py
galvatron/site_package/megatron/text_generation/__init__.py
galvatron/site_package/megatron/text_generation/api.py
galvatron/site_package/megatron/text_generation/beam_utils.py
galvatron/site_package/megatron/text_generation/communication.py
galvatron/site_package/megatron/text_generation/forward_step.py
galvatron/site_package/megatron/text_generation/generation.py
galvatron/site_package/megatron/text_generation/sampling.py
galvatron/site_package/megatron/text_generation/tokenization.py
galvatron/site_package/megatron/tokenizer/__init__.py
galvatron/site_package/megatron/tokenizer/bert_tokenization.py
galvatron/site_package/megatron/tokenizer/gpt2_tokenization.py
galvatron/site_package/megatron/tokenizer/tokenizer.py
galvatron/utils/__init__.py
galvatron/utils/config_utils.py
galvatron/utils/memory_utils.py
galvatron/utils/strategy_utils.py
galvatron/utils/training_utils.py
hetu_galvatron.egg-info/PKG-INFO
hetu_galvatron.egg-info/SOURCES.txt
hetu_galvatron.egg-info/dependency_links.txt
hetu_galvatron.egg-info/requires.txt
hetu_galvatron.egg-info/top_level.txt