Index A | B | C | D | E | F | G | H | I | K | L | M | N | O | P | Q | R | S | T | U | V | W A add_error() (fairseq2.utils.validation.ValidationResult method) add_sub_result() (fairseq2.utils.validation.ValidationResult method) AdditiveResidualConnect (class in fairseq2.nn) all_gather() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) all_gather_to_list() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) all_reduce() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) all_sum() (in module fairseq2.gang) apply_mask() (in module fairseq2.nn.utils.mask) as_process_group() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) B barrier() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) BasicModelCheckpointLoader (class in fairseq2.model_checkpoint) BatchLayout (class in fairseq2.nn) boh_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) bos_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) broadcast() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) broadcast_flag() (in module fairseq2.gang) broadcast_objects() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) C capacity_bytes() (fairseq2.nn.IncrementalState method) (fairseq2.nn.IncrementalStateBag method) capacity_increment (fairseq2.nn.IncrementalStateBag property) close() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gangs method) (fairseq2.gang.ProcessGroupGang method) compiled_max_seq_len (fairseq2.nn.BatchLayout attribute) compute_row_mask() (in module fairseq2.nn.utils.mask) convert_qwen_state_dict() (in module fairseq2.models.qwen) create_decoder() (fairseq2.data.tokenizers.Tokenizer method) (fairseq2.models.qwen.QwenFactory method) (fairseq2.models.qwen.QwenTokenizer method) create_decoder_frontend() (fairseq2.models.qwen.QwenFactory method) create_decoder_layer() (fairseq2.models.qwen.QwenFactory method) create_default_process_group() (fairseq2.gang.ProcessGroupGang class method) create_embedding() (fairseq2.models.qwen.QwenFactory method) create_encoder() (fairseq2.data.tokenizers.Tokenizer method) (fairseq2.models.qwen.QwenTokenizer method) create_fake_gangs() (in module fairseq2.gang) create_ffn() (fairseq2.models.qwen.QwenFactory method) create_final_projection() (fairseq2.models.qwen.QwenFactory method) create_fsdp_gangs() (in module fairseq2.gang) create_gang() (fairseq2.gang.FakeGang method) (fairseq2.gang.Gang method) (fairseq2.gang.ProcessGroupGang method) create_layer_norm() (fairseq2.models.qwen.QwenFactory method) create_model() (fairseq2.models.qwen.QwenFactory method) create_new_model() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) create_parallel_gangs() (in module fairseq2.gang) create_position_encoder() (fairseq2.models.qwen.QwenFactory method) create_qwen_model() (in module fairseq2.models.qwen) create_raw_encoder() (fairseq2.data.tokenizers.Tokenizer method) (fairseq2.models.qwen.QwenTokenizer method) create_self_attention() (fairseq2.models.qwen.QwenFactory method) CudaContext (class in fairseq2.device) D DatasetFamilyNotKnownError DatasetHub (class in fairseq2.datasets.hub) DatasetHubAccessor (class in fairseq2.datasets.hub) DatasetNotKnownError decode_from_tokens() (fairseq2.data.tokenizers.TokenDecoder method) DelegatingModelCheckpointLoader (class in fairseq2.model_checkpoint) device (fairseq2.gang.FakeGang property) (fairseq2.gang.Gang property) (fairseq2.gang.ProcessGroupGang property) device_count() (fairseq2.device.CudaContext method) (fairseq2.device.StandardCudaContext method) dp (fairseq2.gang.Gangs attribute) dropout_p (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) E Embedding (class in fairseq2.nn) encode_as_tokens() (fairseq2.data.tokenizers.TokenEncoder method) eoh_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) eos_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) errors (fairseq2.utils.validation.ValidationResult property) export_qwen() (in module fairseq2.models.qwen) extra_repr() (fairseq2.nn.RMSNorm method) (fairseq2.nn.StandardLayerNorm method) F fairseq2.assets module fairseq2.device module fairseq2.gang module fairseq2.model_checkpoint module fairseq2.models module fairseq2.recipe.optim module fairseq2.utils.validation module FakeGang (class in fairseq2.gang) ffn_inner_dim (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) ffn_inner_dim_multiple_of (fairseq2.models.llama.LLaMAConfig attribute) ffn_inner_dim_multiplier (fairseq2.models.llama.LLaMAConfig attribute) ffn_inner_dim_scale (fairseq2.models.llama.LLaMAConfig attribute) forward() (fairseq2.nn.AdditiveResidualConnect method) (fairseq2.nn.Embedding method) (fairseq2.nn.LayerNorm method) (fairseq2.nn.LearnedPositionEncoder method) (fairseq2.nn.Linear method) (fairseq2.nn.PositionEncoder method) (fairseq2.nn.Projection method) (fairseq2.nn.ResidualConnect method) (fairseq2.nn.RMSNorm method) (fairseq2.nn.RotaryEncoder method) (fairseq2.nn.ScaledResidualConnect method) (fairseq2.nn.ShardedEmbedding method) (fairseq2.nn.SinusoidalPositionEncoder method) (fairseq2.nn.StandardEmbedding method) (fairseq2.nn.StandardLayerNorm method) (fairseq2.nn.TiedProjection method) from_embedding() (fairseq2.nn.ShardedEmbedding static method) G Gang (class in fairseq2.gang) GangError (class in fairseq2.gang) Gangs (class in fairseq2.gang) get_arch_config() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) get_archs() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) get_current_device() (in module fairseq2.device) get_dataset_config() (fairseq2.datasets.hub.DatasetHub method) get_default_device() (in module fairseq2.device) get_device_properties() (fairseq2.device.CudaContext method) (fairseq2.device.StandardCudaContext method) get_model_config() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) get_qwen_shard_specs() (in module fairseq2.models.qwen) get_qwen_tokenizer_hub() (in module fairseq2.models.qwen) get_shard_dims() (fairseq2.nn.ShardedEmbedding method) get_std_scale_factor() (fairseq2.models.qwen.QwenFactory method) get_tokenizer_config() (fairseq2.data.tokenizers.hub.TokenizerHub method) H has_error() (fairseq2.utils.validation.ValidationResult method) head_dim (fairseq2.models.qwen.QwenConfig attribute) I impl (fairseq2.models.llama.LLaMATokenizerConfig attribute) increment_step_nr() (fairseq2.nn.IncrementalStateBag method) IncrementalState (class in fairseq2.nn) IncrementalStateBag (class in fairseq2.nn) init_scaled_embedding() (in module fairseq2.nn) init_std (fairseq2.models.llama.LLaMAConfig attribute) init_std_scale (fairseq2.models.llama.LLaMAConfig attribute) is_available() (fairseq2.device.CudaContext method) (fairseq2.device.StandardCudaContext method) iter_cards() (fairseq2.data.tokenizers.hub.TokenizerHub method) (fairseq2.datasets.hub.DatasetHub method) (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) iter_checkpoint() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) K k_norm (fairseq2.models.qwen.QwenConfig attribute) L LayerNorm (class in fairseq2.nn) lazy_load() (fairseq2.model_checkpoint.BasicModelCheckpointLoader method) (fairseq2.model_checkpoint.DelegatingModelCheckpointLoader method) (fairseq2.model_checkpoint.ModelCheckpointLoader method) (fairseq2.model_checkpoint.NativeModelCheckpointLoader method) (fairseq2.model_checkpoint.SafetensorsCheckpointLoader method) LearnedPositionEncoder (class in fairseq2.nn) Linear (class in fairseq2.nn) LLaMAConfig (class in fairseq2.models.llama) LLaMATokenizerConfig (class in fairseq2.models.llama) load_custom_model() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) load_custom_tokenizer() (fairseq2.data.tokenizers.hub.TokenizerHub method) load_model() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) (in module fairseq2.models) (in module fairseq2.models.hub) load_tokenizer() (fairseq2.data.tokenizers.hub.TokenizerHub method) (in module fairseq2.data.tokenizers.hub) LocalRankOutOfRangeError (class in fairseq2.device) M MAX (fairseq2.gang.ReduceOperation attribute) max_num_steps (fairseq2.nn.IncrementalStateBag property) max_seq_len (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) (fairseq2.nn.BatchLayout property) maybe_get_arch_config() (fairseq2.models.hub.ModelHub method) (fairseq2.models.ModelHub method) maybe_get_current_gangs() (in module fairseq2.gang) maybe_get_state() (fairseq2.nn.IncrementalStateBag method) maybe_raise_param_group_length_error() (in module fairseq2.recipe.optim) MEAN (fairseq2.gang.ReduceOperation attribute) memory_stats() (fairseq2.device.CudaContext method) (fairseq2.device.StandardCudaContext method) MIN (fairseq2.gang.ReduceOperation attribute) min_seq_len (fairseq2.nn.BatchLayout property) model_dim (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) ModelArchitectureNotKnownError (class in fairseq2.models) ModelCheckpointError (class in fairseq2.model_checkpoint) ModelCheckpointLoader (class in fairseq2.model_checkpoint) ModelFamilyNotKnownError (class in fairseq2.models) ModelHub (class in fairseq2.models) (class in fairseq2.models.hub) ModelHubAccessor (class in fairseq2.models) (class in fairseq2.models.hub) ModelNotKnownError (class in fairseq2.models) module fairseq2.assets fairseq2.device fairseq2.gang fairseq2.model_checkpoint fairseq2.models fairseq2.recipe.optim fairseq2.utils.validation N NativeModelCheckpointLoader (class in fairseq2.model_checkpoint) num_attn_heads (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) num_key_value_heads (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) num_layers (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) O ObjectValidator (class in fairseq2.utils.validation) of() (fairseq2.nn.BatchLayout static method) open_custom_dataset() (fairseq2.datasets.hub.DatasetHub method) open_dataset() (fairseq2.datasets.hub.DatasetHub method) P packed (fairseq2.nn.BatchLayout property) pad_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) (fairseq2.models.llama.LLaMAConfig attribute) padded (fairseq2.nn.BatchLayout property) position_indices (fairseq2.nn.BatchLayout property) PositionEncoder (class in fairseq2.nn) pp (fairseq2.gang.Gangs attribute) prefix_indices (fairseq2.data.tokenizers.TokenEncoder property) prepare_parameter_groups() (in module fairseq2.recipe.optim) ProcessGroupGang (class in fairseq2.gang) PRODUCT (fairseq2.gang.ReduceOperation attribute) Projection (class in fairseq2.nn) Q q_norm (fairseq2.models.qwen.QwenConfig attribute) qkv_proj_bias (fairseq2.models.qwen.QwenConfig attribute) QWEN_FAMILY (in module fairseq2.models.qwen) QwenConfig (class in fairseq2.models.qwen) QwenFactory (class in fairseq2.models.qwen) QwenTokenizer (class in fairseq2.models.qwen) QwenTokenizerConfig (class in fairseq2.models.qwen) R raise_operational_gang_error() (in module fairseq2.gang) rank (fairseq2.gang.FakeGang property) (fairseq2.gang.Gang property) (fairseq2.gang.ProcessGroupGang property) rdp (fairseq2.gang.Gangs attribute) ReduceOperation (class in fairseq2.gang) reorder() (fairseq2.nn.IncrementalState method) (fairseq2.nn.IncrementalStateBag method) reset_non_persistent_buffers() (fairseq2.nn.RotaryEncoder method) (fairseq2.nn.SinusoidalPositionEncoder method) reset_parameters() (fairseq2.nn.LearnedPositionEncoder method) (fairseq2.nn.Linear method) (fairseq2.nn.RMSNorm method) (fairseq2.nn.RotaryEncoder method) (fairseq2.nn.ShardedEmbedding method) (fairseq2.nn.SinusoidalPositionEncoder method) (fairseq2.nn.StandardEmbedding method) (fairseq2.nn.StandardLayerNorm method) reset_peak_memory_stats() (fairseq2.device.CudaContext method) (fairseq2.device.StandardCudaContext method) reshard_tensor() (in module fairseq2.model_checkpoint) ResidualConnect (class in fairseq2.nn) result (fairseq2.utils.validation.ValidationError attribute) RMSNorm (class in fairseq2.nn) root (fairseq2.gang.Gangs attribute) rope_scale (fairseq2.models.llama.LLaMAConfig attribute) rope_theta (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) RotaryEncoder (class in fairseq2.nn) S SafetensorsCheckpointLoader (class in fairseq2.model_checkpoint) ScaledResidualConnect (class in fairseq2.nn) sdp (fairseq2.gang.Gangs attribute) seq_begin_indices (fairseq2.nn.BatchLayout property) seq_begin_indices_pt (fairseq2.nn.BatchLayout property) seq_lens (fairseq2.nn.BatchLayout property) seq_lens_pt (fairseq2.nn.BatchLayout property) set_state() (fairseq2.nn.IncrementalStateBag method) shard_embed_dim (fairseq2.models.llama.LLaMAConfig attribute) ShardedEmbedding (class in fairseq2.nn) SinusoidalPositionEncoder (class in fairseq2.nn) size (fairseq2.data.tokenizers.VocabularyInfo attribute) (fairseq2.gang.FakeGang property) (fairseq2.gang.Gang property) (fairseq2.gang.ProcessGroupGang property) size_bytes() (fairseq2.nn.IncrementalState method) (fairseq2.nn.IncrementalStateBag method) split_regex (fairseq2.models.llama.LLaMATokenizerConfig attribute) StandardCudaContext (class in fairseq2.device) StandardEmbedding (class in fairseq2.nn) StandardLayerNorm (class in fairseq2.nn) StandardObjectValidator (class in fairseq2.utils.validation) step_nr (fairseq2.nn.IncrementalStateBag property) sub_results (fairseq2.utils.validation.ValidationResult property) suffix_indices (fairseq2.data.tokenizers.TokenEncoder property) SUM (fairseq2.gang.ReduceOperation attribute) supports_path() (fairseq2.model_checkpoint.BasicModelCheckpointLoader method) (fairseq2.model_checkpoint.DelegatingModelCheckpointLoader method) (fairseq2.model_checkpoint.ModelCheckpointLoader method) (fairseq2.model_checkpoint.NativeModelCheckpointLoader method) (fairseq2.model_checkpoint.SafetensorsCheckpointLoader method) supports_process_group (fairseq2.gang.FakeGang property) (fairseq2.gang.Gang property) (fairseq2.gang.ProcessGroupGang property) SupportsDeviceTransfer (class in fairseq2.device) T tied_embeddings (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) TiedProjection (class in fairseq2.nn) to() (fairseq2.device.SupportsDeviceTransfer method) to_embedding() (fairseq2.nn.ShardedEmbedding method) TokenDecoder (class in fairseq2.data.tokenizers) TokenEncoder (class in fairseq2.data.tokenizers) Tokenizer (class in fairseq2.data.tokenizers) TokenizerFamilyNotKnownError TokenizerHub (class in fairseq2.data.tokenizers.hub) TokenizerHubAccessor (class in fairseq2.data.tokenizers.hub) TokenizerNotKnownError tp (fairseq2.gang.Gangs attribute) U unk_idx (fairseq2.data.tokenizers.VocabularyInfo attribute) use_eot (fairseq2.models.llama.LLaMATokenizerConfig attribute) use_im_end (fairseq2.models.qwen.QwenTokenizerConfig attribute) use_scaled_rope (fairseq2.models.llama.LLaMAConfig attribute) V Validatable (class in fairseq2.utils.validation) validate() (fairseq2.utils.validation.ObjectValidator method) (fairseq2.utils.validation.StandardObjectValidator method) (fairseq2.utils.validation.Validatable method) ValidationError ValidationResult (class in fairseq2.utils.validation) vocab_info (fairseq2.data.tokenizers.Tokenizer property) (fairseq2.models.qwen.QwenTokenizer property) vocab_size (fairseq2.models.llama.LLaMAConfig attribute) (fairseq2.models.qwen.QwenConfig attribute) VocabularyInfo (class in fairseq2.data.tokenizers) W width (fairseq2.nn.BatchLayout property)