LICENSE
README.md
pyproject.toml
src/modalities/__init__.py
src/modalities/__main__.py
src/modalities/activation_checkpointing.py
src/modalities/batch.py
src/modalities/evaluator.py
src/modalities/exceptions.py
src/modalities/gym.py
src/modalities/loss_functions.py
src/modalities/trainer.py
src/modalities/util.py
src/modalities.egg-info/PKG-INFO
src/modalities.egg-info/SOURCES.txt
src/modalities.egg-info/dependency_links.txt
src/modalities.egg-info/entry_points.txt
src/modalities.egg-info/requires.txt
src/modalities.egg-info/top_level.txt
src/modalities/checkpointing/__init__.py
src/modalities/checkpointing/checkpoint_conversion.py
src/modalities/checkpointing/checkpoint_loading.py
src/modalities/checkpointing/checkpoint_saving.py
src/modalities/checkpointing/checkpoint_saving_execution.py
src/modalities/checkpointing/checkpoint_saving_instruction.py
src/modalities/checkpointing/checkpoint_saving_strategies.py
src/modalities/checkpointing/fsdp/__init__.py
src/modalities/checkpointing/fsdp/fsdp_checkpoint_loading.py
src/modalities/checkpointing/fsdp/fsdp_checkpoint_saving.py
src/modalities/checkpointing/torch/__init__.py
src/modalities/checkpointing/torch/torch_checkpoint_loading.py
src/modalities/checkpointing/torch/torch_checkpoint_saving.py
src/modalities/config/__init__.py
src/modalities/config/component_factory.py
src/modalities/config/config.py
src/modalities/config/instantiation_models.py
src/modalities/config/lookup_enum.py
src/modalities/config/pydanctic_if_types.py
src/modalities/config/utils.py
src/modalities/dataloader/__init__.py
src/modalities/dataloader/create_index.py
src/modalities/dataloader/create_packed_data.py
src/modalities/dataloader/dataloader.py
src/modalities/dataloader/dataloader_factory.py
src/modalities/dataloader/dataset.py
src/modalities/dataloader/dataset_factory.py
src/modalities/dataloader/large_file_lines_reader.py
src/modalities/dataloader/samplers.py
src/modalities/inference/__init__.py
src/modalities/inference/inference.py
src/modalities/inference/text/__init__.py
src/modalities/inference/text/config.py
src/modalities/inference/text/inference_component.py
src/modalities/logging_broker/__init__.py
src/modalities/logging_broker/message_broker.py
src/modalities/logging_broker/messages.py
src/modalities/logging_broker/publisher.py
src/modalities/logging_broker/subscriber.py
src/modalities/logging_broker/subscriber_impl/__init__.py
src/modalities/logging_broker/subscriber_impl/batch_progress_subscriber.py
src/modalities/logging_broker/subscriber_impl/results_subscriber.py
src/modalities/logging_broker/subscriber_impl/subscriber_factory.py
src/modalities/models/__init__.py
src/modalities/models/model.py
src/modalities/models/model_factory.py
src/modalities/models/utils.py
src/modalities/models/coca/__init__.py
src/modalities/models/coca/attention_pooling.py
src/modalities/models/coca/coca_model.py
src/modalities/models/coca/collator.py
src/modalities/models/coca/multi_modal_decoder.py
src/modalities/models/coca/text_decoder.py
src/modalities/models/components/__init__.py
src/modalities/models/components/layer_norms.py
src/modalities/models/gpt2/__init__.py
src/modalities/models/gpt2/collator.py
src/modalities/models/gpt2/gpt2_model.py
src/modalities/models/gpt2/pretrained_gpt_model.py
src/modalities/models/huggingface/__init__.py
src/modalities/models/huggingface/huggingface_model.py
src/modalities/models/huggingface_adapters/__init__.py
src/modalities/models/huggingface_adapters/hf_adapter.py
src/modalities/models/vision_transformer/__init__.py
src/modalities/models/vision_transformer/vision_transformer_model.py
src/modalities/nn/__init__.py
src/modalities/nn/attention.py
src/modalities/nn/mlp.py
src/modalities/nn/model_initialization/__init__.py
src/modalities/nn/model_initialization/composed_initialization.py
src/modalities/nn/model_initialization/initialization_if.py
src/modalities/nn/model_initialization/initialization_routines.py
src/modalities/nn/model_initialization/parameter_name_filters.py
src/modalities/optimizers/__init__.py
src/modalities/optimizers/lr_schedulers.py
src/modalities/optimizers/optimizer_factory.py
src/modalities/registry/__init__.py
src/modalities/registry/components.py
src/modalities/registry/registry.py
src/modalities/running_env/__init__.py
src/modalities/running_env/cuda_env.py
src/modalities/running_env/env_utils.py
src/modalities/running_env/fsdp/__init__.py
src/modalities/running_env/fsdp/fsdp_auto_wrapper.py
src/modalities/running_env/fsdp/reducer.py
src/modalities/tokenization/__init__.py
src/modalities/tokenization/tokenizer_wrapper.py
src/modalities/training/__init__.py
src/modalities/training/gradient_clipping/__init__.py
src/modalities/training/gradient_clipping/fsdp_gradient_clipper.py
src/modalities/training/gradient_clipping/fsdp_gradient_clipper_config.py
src/modalities/training/gradient_clipping/gradient_clipper.py
src/modalities/utils/mfu.py
src/modalities/utils/number_conversion.py
tests/test_evaluator.py
tests/test_gym.py
tests/test_initialization.py
tests/test_loss_functions.py
tests/test_lr_scheduler.py
tests/test_main.py
tests/test_optimizer_factory.py
tests/test_rotary_qkv_transform.py
tests/test_tokenization.py
tests/test_utils.py
tests/tests.py