LICENSE
MANIFEST.in
README.md
requirements.txt
setup.py
SwissArmyTransformer.egg-info/PKG-INFO
SwissArmyTransformer.egg-info/SOURCES.txt
SwissArmyTransformer.egg-info/dependency_links.txt
SwissArmyTransformer.egg-info/requires.txt
SwissArmyTransformer.egg-info/top_level.txt
sat/__init__.py
sat/arguments.py
sat/helpers.py
sat/transformer_defaults.py
sat/data_utils/__init__.py
sat/data_utils/configure_data.py
sat/data_utils/datasets.py
sat/data_utils/hf_dataset.py
sat/data_utils/jsonlds.py
sat/data_utils/samplers.py
sat/data_utils/webds.py
sat/generation/__init__.py
sat/generation/autoregressive_sampling.py
sat/generation/cuda2d_sampling.py
sat/generation/magnify.py
sat/generation/utils.py
sat/generation/sampling_strategies/__init__.py
sat/generation/sampling_strategies/base_strategy.py
sat/generation/sampling_strategies/beam_search_strategy.py
sat/generation/sampling_strategies/iterative_entfilter_strategy.py
sat/model/__init__.py
sat/model/base_model.py
sat/model/cached_autoregressive_model.py
sat/model/encoder_decoder_model.py
sat/model/mixins.py
sat/model/registry.py
sat/model/transformer.py
sat/model/attention/__init__.py
sat/model/attention/memory_efficient_attention.py
sat/model/finetune/__init__.py
sat/model/finetune/adapter.py
sat/model/finetune/ffadd.py
sat/model/finetune/lora.py
sat/model/finetune/lora2.py
sat/model/finetune/mlp_head.py
sat/model/finetune/prompt_tuning.py
sat/model/official/__init__.py
sat/model/official/bert_model.py
sat/model/official/cait_model.py
sat/model/official/chatglm2_model.py
sat/model/official/chatglm3_model.py
sat/model/official/chatglm4_model.py
sat/model/official/chatglm_model.py
sat/model/official/clip_model.py
sat/model/official/cuda2d_model.py
sat/model/official/distill_model.py
sat/model/official/dpr_model.py
sat/model/official/eva2_model.py
sat/model/official/eva_clip_model.py
sat/model/official/glm130B_model.py
sat/model/official/glm4v_model.py
sat/model/official/glm_model.py
sat/model/official/gpt2_model.py
sat/model/official/gptneo_model.py
sat/model/official/llama_model.py
sat/model/official/mae_model.py
sat/model/official/mixtral_model.py
sat/model/official/roberta_model.py
sat/model/official/t5_model.py
sat/model/official/vit_model.py
sat/model/official/yolos_model.py
sat/model/position_embedding/__init__.py
sat/model/position_embedding/rotary_embeddings.py
sat/model/position_embedding/rotary_embeddings_original.py
sat/model/position_embedding/sincos2d.py
sat/model/position_embedding/triton_rotary.py
sat/model/position_embedding/triton_rotary_embeddings.py
sat/model/position_embedding/vision_rotary_embeddings.py
sat/mpu/__init__.py
sat/mpu/cross_entropy.py
sat/mpu/data.py
sat/mpu/initialize.py
sat/mpu/layers.py
sat/mpu/mappings.py
sat/mpu/operation.py
sat/mpu/utils.py
sat/ops/__init__.py
sat/ops/fused_ema_adam.py
sat/ops/layernorm.py
sat/ops/local_attention_function.py
sat/ops/memory_efficient_attention.py
sat/ops/scaled_mask_softmax.py
sat/ops/csrc/adam/fused_ema_adam_frontend.cpp
sat/ops/csrc/adam/multi_tensor_apply.cuh
sat/ops/csrc/adam/multi_tensor_ema_adam.cu
sat/ops/csrc/includes/compat.h
sat/ops/csrc/includes/type_shim.h
sat/ops/ops_builder/__init__.py
sat/ops/ops_builder/builder.py
sat/ops/ops_builder/fused_ema_adam.py
sat/quantization/__init__.py
sat/quantization/kernels.py
sat/resources/__init__.py
sat/resources/download.py
sat/resources/urls.py
sat/tokenization/__init__.py
sat/tokenization/hf_tokenizer.py
sat/tokenization/cogview/__init__.py
sat/tokenization/cogview/sp_tokenizer.py
sat/tokenization/cogview/templates.py
sat/tokenization/cogview/unified_tokenizer.py
sat/tokenization/cogview/vqvae_tokenizer.py
sat/tokenization/cogview/vqvae/__init__.py
sat/tokenization/cogview/vqvae/api.py
sat/tokenization/cogview/vqvae/vqvae_diffusion.py
sat/tokenization/cogview/vqvae/vqvae_zc.py
sat/tokenization/embed_assets/chinese_sentencepiece/cog-pretrain.model
sat/tokenization/embed_assets/chinese_sentencepiece/cog-pretrain.vocab
sat/tokenization/embed_assets/english_tokenizer/bert-base-uncased-vocab.txt
sat/tokenization/embed_assets/english_tokenizer/bert-large-uncased-vocab.txt
sat/tokenization/embed_assets/english_tokenizer/gpt2-merges.txt
sat/tokenization/embed_assets/english_tokenizer/gpt2-vocab.json
sat/tokenization/embed_assets/english_tokenizer/roberta-merges.txt
sat/tokenization/embed_assets/english_tokenizer/roberta-vocab.json
sat/tokenization/glm/__init__.py
sat/tokenization/glm/sp_tokenizer.py
sat/tokenization/glm/tokenization.py
sat/tokenization/glm/tokenization_gpt2.py
sat/tokenization/glm/tokenization_wordpiece.py
sat/tokenization/icetk_glm_130B/__init__.py
sat/tokenization/icetk_glm_130B/ice_tokenizer.py
sat/tokenization/icetk_glm_130B/tokenizer.py
sat/training/__init__.py
sat/training/deepspeed_training.py
sat/training/deepspeed_zero0.json
sat/training/deepspeed_zero1.json
sat/training/deepspeed_zero2.json
sat/training/learning_rates.py
sat/training/model_io.py
sat/training/utils.py
tests/test_base_model.py
tests/test_inference.py
tests/test_jsonlds.py
tests/test_list_info.py
tests/test_mea.py
tests/test_model_parallel.py
tests/test_multi_webds.py
tests/test_nested_model.py
tests/test_read_img.py
tests/test_remote_data.py
tests/test_speed.py
tests/test_train.py
tests/test_train_dp.py
tests/test_train_nested.py
tests/test_triton_rotary_embedding.py