Index A | B | C | D | E | F | G | H | I | K | L | M | N | O | P | Q | R | S | T | U | V | W A add_error() (fairseq2.utils.validation.ValidationResult method) add_sub_result() (fairseq2.utils.validation.ValidationResult method) AdditiveResidualConnect (class in fairseq2.nn) all_gather() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) all_gather_to_list() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) all_reduce() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) all_sum() (in module fairseq2.gang) apply_mask() (in module fairseq2.nn.utils.mask) arch (fairseq2.models.hg.HuggingFaceConfig attribute) as_process_group() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) B barrier() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) BatchLayout (class in fairseq2.nn) boh_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) bos_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) broadcast() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) broadcast_flag() (in module fairseq2.gang) broadcast_objects() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) C capacity_bytes() (fairseq2.nn.IncrementalState method) (fairseq2.nn.IncrementalStateBag method) capacity_increment (fairseq2.nn.IncrementalStateBag property) clip_grad_norm() (fairseq2.nn.data_parallel.DataParallelFacade method) close() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gangs method) (fairseq2.gang.ProcessGroupGang method) compiled_max_seq_len (fairseq2.nn.BatchLayout attribute) compute_row_mask() (in module fairseq2.nn.utils.mask) CorruptModelCheckpointError (class in fairseq2.model_checkpoint) create_decoder() (fairseq2.data.tokenizers.Tokenizer method) (fairseq2.models.qwen.QwenTokenizer method) create_default_process_group() (fairseq2.gang.ProcessGroupGang class method) create_encoder() (fairseq2.data.tokenizers.Tokenizer method) (fairseq2.models.qwen.QwenTokenizer method) create_fake_gangs() (in module fairseq2.gang) create_fsdp_gangs() (in module fairseq2.gang) create_gang() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) create_new_model() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) create_parallel_gangs() (in module fairseq2.gang) create_raw_encoder() (fairseq2.data.tokenizers.Tokenizer method) (fairseq2.models.qwen.QwenTokenizer method) CudaContext (class in fairseq2.device) D data (fairseq2.models.hg.HuggingFaceConfig attribute) DataParallelFacade (class in fairseq2.nn.data_parallel) DatasetHub (class in fairseq2.datasets.hub) DatasetHubAccessor (class in fairseq2.datasets.hub) DataTypeContext (class in fairseq2.data_type) decode_from_tokens() (fairseq2.data.tokenizers.TokenDecoder method) detect_default_device() (in module fairseq2.device) device (fairseq2.gang.FakeGang property) (fairseq2.gang.Gang property) (fairseq2.gang.Gangs property) (fairseq2.gang.ProcessGroupGang property) device_count() (fairseq2.device.CudaContext method) DeviceContext (class in fairseq2.device) dp (fairseq2.gang.Gangs attribute) dropout_p (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) E Embedding (class in fairseq2.nn) encode_as_tokens() (fairseq2.data.tokenizers.TokenEncoder method) eoh_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) eos_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) errors (fairseq2.utils.validation.ValidationResult property) extra_repr() (fairseq2.nn.RMSNorm method) (fairseq2.nn.StandardLayerNorm method) F fairseq2 module fairseq2.assets module fairseq2.data_type module fairseq2.device module fairseq2.gang module fairseq2.model_checkpoint module fairseq2.models module fairseq2.models.hg module fairseq2.recipe.composition module fairseq2.recipe.optim module fairseq2.utils.validation module FakeGang (class in fairseq2.gang) ffn_inner_dim (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) ffn_inner_dim_multiple_of (fairseq2.models.llama.LLaMAConfig attribute) ffn_inner_dim_multiplier (fairseq2.models.llama.LLaMAConfig attribute) ffn_inner_dim_scale (fairseq2.models.llama.LLaMAConfig attribute) forward() (fairseq2.nn.AdditiveResidualConnect method) (fairseq2.nn.Embedding method) (fairseq2.nn.LayerNorm method) (fairseq2.nn.LearnedPositionEncoder method) (fairseq2.nn.Linear method) (fairseq2.nn.PositionEncoder method) (fairseq2.nn.Projection method) (fairseq2.nn.ResidualConnect method) (fairseq2.nn.RMSNorm method) (fairseq2.nn.RotaryEncoder method) (fairseq2.nn.ScaledResidualConnect method) (fairseq2.nn.ShardedEmbedding method) (fairseq2.nn.SinusoidalPositionEncoder method) (fairseq2.nn.StandardEmbedding method) (fairseq2.nn.StandardLayerNorm method) (fairseq2.nn.TiedProjection method) from_embedding() (fairseq2.nn.ShardedEmbedding static method) G Gang (class in fairseq2.gang) GangContext (class in fairseq2.gang) GangError (class in fairseq2.gang) Gangs (class in fairseq2.gang) gangs (fairseq2.model_checkpoint.ModelCheckpointLoadOptions attribute) get_arch_config() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) get_archs() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) get_current_device() (fairseq2.device.DeviceContext method) (in module fairseq2.device) get_current_dtype() (fairseq2.data_type.DataTypeContext method) (in module fairseq2.data_type) get_current_gangs() (fairseq2.gang.GangContext method) (in module fairseq2.gang) get_data_parallel_facade() (in module fairseq2.nn.data_parallel) get_dataset_config() (fairseq2.datasets.hub.DatasetHub method) get_default_gangs() (in module fairseq2.gang) get_device_properties() (fairseq2.device.CudaContext method) get_hugging_face_converter() (in module fairseq2.models.hg) get_model_checkpoint_loader() (in module fairseq2.model_checkpoint) get_model_config() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) get_qwen_tokenizer_hub() (in module fairseq2.models.qwen) get_shard_dims() (fairseq2.nn.ShardedEmbedding method) get_tokenizer_config() (fairseq2.data.tokenizers.hub.TokenizerHub method) H has_error() (fairseq2.utils.validation.ValidationResult method) head_dim (fairseq2.models.qwen.QwenConfig attribute) HuggingFaceConfig (class in fairseq2.models.hg) HuggingFaceConverter (class in fairseq2.models.hg) I impl (fairseq2.models.llama.LLaMATokenizerConfig attribute) increment_step_nr() (fairseq2.nn.IncrementalStateBag method) IncrementalState (class in fairseq2.nn) IncrementalStateBag (class in fairseq2.nn) init_scaled_embedding() (in module fairseq2.nn) init_std (fairseq2.models.llama.LLaMAConfig attribute) init_std_scale (fairseq2.models.llama.LLaMAConfig attribute) is_available() (fairseq2.device.CudaContext method) iter_cards() (fairseq2.data.tokenizers.hub.TokenizerHub method) (fairseq2.datasets.hub.DatasetHub method) (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) iter_checkpoint() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) K k_norm (fairseq2.models.qwen.QwenConfig attribute) kls_name (fairseq2.models.hg.HuggingFaceConfig attribute) L LayerNorm (class in fairseq2.nn) lazy_load() (fairseq2.model_checkpoint.ModelCheckpointLoader method) LearnedPositionEncoder (class in fairseq2.nn) Linear (class in fairseq2.nn) LLaMAConfig (class in fairseq2.models.llama) LLaMATokenizerConfig (class in fairseq2.models.llama) load_custom_model() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) load_custom_tokenizer() (fairseq2.data.tokenizers.hub.TokenizerHub method) load_model() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) (in module fairseq2.models) (in module fairseq2.models.hub) load_state_dict() (fairseq2.nn.data_parallel.DataParallelFacade method) load_tokenizer() (fairseq2.data.tokenizers.hub.TokenizerHub method) (in module fairseq2.data.tokenizers.hub) LocalRankOutOfRangeError (class in fairseq2.device) M MAX (fairseq2.gang.ReduceOperation attribute) max_num_steps (fairseq2.nn.IncrementalStateBag property) max_seq_len (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) (fairseq2.nn.BatchLayout property) maybe_get_arch_config() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) maybe_get_state() (fairseq2.nn.IncrementalStateBag method) maybe_raise_param_group_length_error() (in module fairseq2.recipe.optim) MEAN (fairseq2.gang.ReduceOperation attribute) memory_stats() (fairseq2.device.CudaContext method) MIN (fairseq2.gang.ReduceOperation attribute) min_seq_len (fairseq2.nn.BatchLayout property) mmap (fairseq2.model_checkpoint.ModelCheckpointLoadOptions attribute) model_dim (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) ModelArchitectureNotKnownError (class in fairseq2.models) ModelCheckpointLoader (class in fairseq2.model_checkpoint) ModelCheckpointLoadOptions (class in fairseq2.model_checkpoint) ModelFamilyNotKnownError (class in fairseq2.models) ModelHub (class in fairseq2.models) (class in fairseq2.models.hub) ModelHubAccessor (class in fairseq2.models) (class in fairseq2.models.hub) ModelNotKnownError (class in fairseq2.models) module fairseq2 fairseq2.assets fairseq2.data_type fairseq2.device fairseq2.gang fairseq2.model_checkpoint fairseq2.models fairseq2.models.hg fairseq2.recipe.composition fairseq2.recipe.optim fairseq2.utils.validation N no_sync() (fairseq2.nn.data_parallel.DataParallelFacade method) num_attn_heads (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) num_key_value_heads (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) num_layers (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) O ObjectValidator (class in fairseq2.utils.validation) of() (fairseq2.nn.BatchLayout static method) open_custom_dataset() (fairseq2.datasets.hub.DatasetHub method) open_dataset() (fairseq2.datasets.hub.DatasetHub method) P packed (fairseq2.nn.BatchLayout property) pad_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) (fairseq2.models.llama.LLaMAConfig attribute) padded (fairseq2.nn.BatchLayout property) position_indices (fairseq2.nn.BatchLayout property) PositionEncoder (class in fairseq2.nn) pp (fairseq2.gang.Gangs attribute) prefix_indices (fairseq2.data.tokenizers.TokenEncoder property) prepare_parameter_groups() (in module fairseq2.recipe.optim) ProcessGroupGang (class in fairseq2.gang) PRODUCT (fairseq2.gang.ReduceOperation attribute) Projection (class in fairseq2.nn) Q q_norm (fairseq2.models.qwen.QwenConfig attribute) qkv_proj_bias (fairseq2.models.qwen.QwenConfig attribute) QWEN_FAMILY (in module fairseq2.models.qwen) QwenConfig (class in fairseq2.models.qwen) QwenTokenizer (class in fairseq2.models.qwen) QwenTokenizerConfig (class in fairseq2.models.qwen) R rank (fairseq2.gang.FakeGang property) (fairseq2.gang.Gang property) (fairseq2.gang.ProcessGroupGang property) rdp (fairseq2.gang.Gangs attribute) ReduceOperation (class in fairseq2.gang) register_recipe_assets() (in module fairseq2.recipe.composition) reorder() (fairseq2.nn.IncrementalState method) (fairseq2.nn.IncrementalStateBag method) reset_non_persistent_buffers() (fairseq2.nn.RotaryEncoder method) (fairseq2.nn.SinusoidalPositionEncoder method) reset_parameters() (fairseq2.nn.LearnedPositionEncoder method) (fairseq2.nn.Linear method) (fairseq2.nn.RMSNorm method) (fairseq2.nn.RotaryEncoder method) (fairseq2.nn.ShardedEmbedding method) (fairseq2.nn.SinusoidalPositionEncoder method) (fairseq2.nn.StandardEmbedding method) (fairseq2.nn.StandardLayerNorm method) reset_peak_memory_stats() (fairseq2.device.CudaContext method) reshard_tensor() (in module fairseq2.model_checkpoint) ResidualConnect (class in fairseq2.nn) restrict (fairseq2.model_checkpoint.ModelCheckpointLoadOptions attribute) result (fairseq2.utils.validation.ValidationError attribute) RMSNorm (class in fairseq2.nn) root (fairseq2.gang.Gangs attribute) rope_scale (fairseq2.models.llama.LLaMAConfig attribute) rope_theta (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) RotaryEncoder (class in fairseq2.nn) S save_hugging_face_model() (in module fairseq2.models.hg) ScaledResidualConnect (class in fairseq2.nn) sdp (fairseq2.gang.Gangs attribute) seq_begin_indices (fairseq2.nn.BatchLayout property) seq_begin_indices_pt (fairseq2.nn.BatchLayout property) seq_lens (fairseq2.nn.BatchLayout property) seq_lens_pt (fairseq2.nn.BatchLayout property) set_data_parallel_facade() (in module fairseq2.nn.data_parallel) set_default_gangs() (in module fairseq2.gang) set_device() (fairseq2.device.DeviceContext method) (in module fairseq2.device) set_dtype() (fairseq2.data_type.DataTypeContext method) (in module fairseq2.data_type) set_gangs() (fairseq2.gang.GangContext method) (in module fairseq2.gang) set_state() (fairseq2.nn.IncrementalStateBag method) shard_embed_dim (fairseq2.models.llama.LLaMAConfig attribute) ShardedEmbedding (class in fairseq2.nn) SinusoidalPositionEncoder (class in fairseq2.nn) size (fairseq2.data.tokenizers.VocabularyInfo attribute) (fairseq2.gang.FakeGang property) (fairseq2.gang.Gang property) (fairseq2.gang.ProcessGroupGang property) size_bytes() (fairseq2.nn.IncrementalState method) (fairseq2.nn.IncrementalStateBag method) split_regex (fairseq2.models.llama.LLaMATokenizerConfig attribute) StandardEmbedding (class in fairseq2.nn) StandardLayerNorm (class in fairseq2.nn) StandardObjectValidator (class in fairseq2.utils.validation) state_dict() (fairseq2.nn.data_parallel.DataParallelFacade method) state_dict_converter (fairseq2.model_checkpoint.ModelCheckpointLoadOptions attribute) step_nr (fairseq2.nn.IncrementalStateBag property) sub_results (fairseq2.utils.validation.ValidationResult property) suffix_indices (fairseq2.data.tokenizers.TokenEncoder property) SUM (fairseq2.gang.ReduceOperation attribute) summon_full_parameters() (fairseq2.nn.data_parallel.DataParallelFacade method) supports_path() (fairseq2.model_checkpoint.ModelCheckpointLoader method) supports_process_group (fairseq2.gang.FakeGang property) (fairseq2.gang.Gang property) (fairseq2.gang.ProcessGroupGang property) SupportsDeviceTransfer (class in fairseq2.device) T tied_embeddings (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) TiedProjection (class in fairseq2.nn) to() (fairseq2.device.SupportsDeviceTransfer method) to_embedding() (fairseq2.nn.ShardedEmbedding method) to_hg_config() (fairseq2.models.hg.HuggingFaceConverter method) to_hg_state_dict() (fairseq2.models.hg.HuggingFaceConverter method) TokenDecoder (class in fairseq2.data.tokenizers) TokenEncoder (class in fairseq2.data.tokenizers) Tokenizer (class in fairseq2.data.tokenizers) TokenizerHub (class in fairseq2.data.tokenizers.hub) TokenizerHubAccessor (class in fairseq2.data.tokenizers.hub) tp (fairseq2.gang.Gangs attribute) U unk_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) use_eot (fairseq2.models.llama.LLaMATokenizerConfig attribute) use_im_end (fairseq2.models.qwen.QwenTokenizerConfig attribute) use_scaled_rope (fairseq2.models.llama.LLaMAConfig attribute) V Validatable (class in fairseq2.utils.validation) validate() (fairseq2.utils.validation.ObjectValidator method) (fairseq2.utils.validation.StandardObjectValidator method) (fairseq2.utils.validation.Validatable method) ValidationError ValidationResult (class in fairseq2.utils.validation) vocab_info (fairseq2.data.tokenizers.Tokenizer property) (fairseq2.models.qwen.QwenTokenizer property) vocab_size (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) VocabularyInfo (class in fairseq2.data.tokenizers) W width (fairseq2.nn.BatchLayout property)