API Reference
This page contains auto-generated API reference documentation [1].
- xlstm_jax
- xlstm_jax.common_types
- xlstm_jax.configs
- xlstm_jax.dataset
- xlstm_jax.dataset.batch
- xlstm_jax.dataset.configs
- xlstm_jax.dataset.grain_batch_rampup
- xlstm_jax.dataset.grain_data_processing
- xlstm_jax.dataset.grain_iterator
- xlstm_jax.dataset.grain_transforms
- xlstm_jax.dataset.hf_tokenizer
- xlstm_jax.dataset.input_pipeline_interface
- xlstm_jax.dataset.lmeval_dataset
- xlstm_jax.dataset.lmeval_pipeline
- xlstm_jax.dataset.multihost_dataloading
- xlstm_jax.dataset.synthetic_dataloading
- xlstm_jax.define_hydra_schemas
- xlstm_jax.distributed
- xlstm_jax.import_utils
- xlstm_jax.kernels
- xlstm_jax.kernels.kernel_utils
- xlstm_jax.kernels.mlstm_chunkwise
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v3
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v3noslice
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v5xlchunksize
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v5xlchunksize._chunkwise_gates
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v5xlchunksize._combined_bw
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v5xlchunksize._combined_fw
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v5xlchunksize._parallel_bw_dK
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v5xlchunksize._parallel_bw_dQ
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v5xlchunksize._parallel_bw_dV
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v5xlchunksize._parallel_fw
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v5xlchunksize._recurrent_bw
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v5xlchunksize._recurrent_fw
- xlstm_jax.kernels.mlstm_chunkwise.max_triton_fwbw_v5xlchunksize.triton_fwbw
- xlstm_jax.kernels.mlstm_chunkwise.triton_stablef
- xlstm_jax.kernels.mlstm_recurrent
- xlstm_jax.kernels.stride_utils
- xlstm_jax.main_train
- xlstm_jax.models
- xlstm_jax.models.configs
- xlstm_jax.models.llama
- xlstm_jax.models.shared
- xlstm_jax.models.xlstm_clean
- xlstm_jax.models.xlstm_clean.blocks
- xlstm_jax.models.xlstm_clean.components
- xlstm_jax.models.xlstm_clean.utils
- xlstm_jax.models.xlstm_clean.xlstm_block_stack
- xlstm_jax.models.xlstm_clean.xlstm_lm_model
- xlstm_jax.models.xlstm_parallel
- xlstm_jax.models.xlstm_parallel.benchmark
- xlstm_jax.models.xlstm_parallel.blocks
- xlstm_jax.models.xlstm_parallel.blocks.mlstm
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.backend
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.backend.attention
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.backend.config
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.backend.config_utils
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.backend.fwbw
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.backend.layer_factory
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.backend.recurrent
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.backend.recurrent_triton
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.backend.simple
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.backend.triton_kernels
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.backend_utils
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.block
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.cell
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.layer
- xlstm_jax.models.xlstm_parallel.blocks.mlstm.layer_v1
- xlstm_jax.models.xlstm_parallel.blocks.xlstm_block
- xlstm_jax.models.xlstm_parallel.checkpointing
- xlstm_jax.models.xlstm_parallel.components
- xlstm_jax.models.xlstm_parallel.training
- xlstm_jax.models.xlstm_parallel.utils
- xlstm_jax.models.xlstm_parallel.xlstm_block_stack
- xlstm_jax.models.xlstm_parallel.xlstm_lm_model
- xlstm_jax.models.xlstm_pytorch
- xlstm_jax.models.xlstm_pytorch.blocks
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm.backend
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm.backend.config
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm.backend.config_utils
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm.backend.fwbw
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm.backend.layer_factory
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm.backend.simple
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm.backend.tl_utils
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm.backend.triton_chunk
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm.block
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm.cell
- xlstm_jax.models.xlstm_pytorch.blocks.mlstm.layer
- xlstm_jax.models.xlstm_pytorch.blocks.slstm
- xlstm_jax.models.xlstm_pytorch.blocks.xlstm_block
- xlstm_jax.models.xlstm_pytorch.components
- xlstm_jax.models.xlstm_pytorch.utils
- xlstm_jax.models.xlstm_pytorch.xlstm_block_stack
- xlstm_jax.models.xlstm_pytorch.xlstm_lm_model
- xlstm_jax.resume_training
- xlstm_jax.start_training
- xlstm_jax.train_init_fns
- xlstm_jax.trainer
- xlstm_jax.utils
- lmeval_extended_evaluation