LICENSE
README.md
pyproject.toml
fla/__init__.py
fla/utils.py
fla/modules/__init__.py
fla/modules/activations.py
fla/modules/convolution.py
fla/modules/feature_map.py
fla/modules/fused_bitlinear.py
fla/modules/fused_cross_entropy.py
fla/modules/fused_kl_div.py
fla/modules/fused_linear_cross_entropy.py
fla/modules/fused_norm_gate.py
fla/modules/grpo.py
fla/modules/l2norm.py
fla/modules/l2warp.py
fla/modules/layernorm.py
fla/modules/layernorm_gated.py
fla/modules/mlp.py
fla/modules/parallel.py
fla/modules/rotary.py
fla/modules/token_shift.py
fla/modules/conv/__init__.py
fla/modules/conv/causal_conv1d.py
fla/modules/conv/long_conv.py
fla/modules/conv/short_conv.py
fla/modules/conv/cp/__init__.py
fla/modules/conv/cp/ops.py
fla/modules/conv/cuda/__init__.py
fla/modules/conv/cuda/ops.py
fla/modules/conv/triton/__init__.py
fla/modules/conv/triton/kernels.py
fla/modules/conv/triton/ops.py
fla/ops/__init__.py
fla/ops/abc/__init__.py
fla/ops/abc/chunk.py
fla/ops/abc/naive.py
fla/ops/attn/__init__.py
fla/ops/attn/decoding.py
fla/ops/attn/naive.py
fla/ops/attn/parallel.py
fla/ops/backends/__init__.py
fla/ops/based/__init__.py
fla/ops/based/fused_chunk.py
fla/ops/based/naive.py
fla/ops/based/parallel.py
fla/ops/comba/__init__.py
fla/ops/comba/chunk.py
fla/ops/comba/fused_recurrent.py
fla/ops/comba/naive.py
fla/ops/comba/utils.py
fla/ops/comba/wy_fast.py
fla/ops/common/__init__.py
fla/ops/common/chunk_delta_h.py
fla/ops/common/chunk_h.py
fla/ops/common/chunk_h_parallel.py
fla/ops/common/chunk_h_split.py
fla/ops/common/chunk_o.py
fla/ops/common/chunk_scaled_dot_kkt.py
fla/ops/common/fused_chunk.py
fla/ops/common/fused_recurrent.py
fla/ops/common/intracard_cp.py
fla/ops/common/backends/__init__.py
fla/ops/common/backends/intracard.py
fla/ops/cp/__init__.py
fla/ops/cp/chunk_delta_h.py
fla/ops/cp/comm.py
fla/ops/cp/context.py
fla/ops/delta_rule/__init__.py
fla/ops/delta_rule/chunk.py
fla/ops/delta_rule/fused_chunk.py
fla/ops/delta_rule/fused_recurrent.py
fla/ops/delta_rule/naive.py
fla/ops/delta_rule/parallel.py
fla/ops/delta_rule/wy_fast.py
fla/ops/deltaformer/__init__.py
fla/ops/deltaformer/invcum.py
fla/ops/deltaformer/naive.py
fla/ops/deltaformer/parallel.py
fla/ops/forgetting_attn/__init__.py
fla/ops/forgetting_attn/naive.py
fla/ops/forgetting_attn/parallel.py
fla/ops/gated_delta_product/__init__.py
fla/ops/gated_delta_product/chunk.py
fla/ops/gated_delta_product/chunk_deltaproduct_h.py
fla/ops/gated_delta_product/chunk_deltaproduct_o.py
fla/ops/gated_delta_product/chunk_ref.py
fla/ops/gated_delta_product/naive.py
fla/ops/gated_delta_rule/__init__.py
fla/ops/gated_delta_rule/chunk.py
fla/ops/gated_delta_rule/fused_recurrent.py
fla/ops/gated_delta_rule/naive.py
fla/ops/gated_delta_rule/wy_fast.py
fla/ops/gated_oja_rule/__init__.py
fla/ops/gated_oja_rule/chunk.py
fla/ops/gated_oja_rule/chunk_h.py
fla/ops/gated_oja_rule/chunk_kkt.py
fla/ops/gated_oja_rule/chunk_o.py
fla/ops/gated_oja_rule/fused_recurrent.py
fla/ops/gated_oja_rule/wy_fast.py
fla/ops/generalized_delta_rule/__init__.py
fla/ops/generalized_delta_rule/dplr/__init__.py
fla/ops/generalized_delta_rule/dplr/chunk.py
fla/ops/generalized_delta_rule/dplr/chunk_A_bwd.py
fla/ops/generalized_delta_rule/dplr/chunk_A_fwd.py
fla/ops/generalized_delta_rule/dplr/chunk_h_bwd.py
fla/ops/generalized_delta_rule/dplr/chunk_h_fwd.py
fla/ops/generalized_delta_rule/dplr/chunk_o_bwd.py
fla/ops/generalized_delta_rule/dplr/chunk_o_fwd.py
fla/ops/generalized_delta_rule/dplr/fused_recurrent.py
fla/ops/generalized_delta_rule/dplr/naive.py
fla/ops/generalized_delta_rule/dplr/wy_fast_bwd.py
fla/ops/generalized_delta_rule/dplr/wy_fast_fwd.py
fla/ops/generalized_delta_rule/iplr/__init__.py
fla/ops/generalized_delta_rule/iplr/chunk.py
fla/ops/generalized_delta_rule/iplr/fused_recurrent.py
fla/ops/generalized_delta_rule/iplr/naive.py
fla/ops/generalized_delta_rule/iplr/wy_fast.py
fla/ops/gla/__init__.py
fla/ops/gla/chunk.py
fla/ops/gla/fused_chunk.py
fla/ops/gla/fused_recurrent.py
fla/ops/gla/naive.py
fla/ops/gsa/__init__.py
fla/ops/gsa/chunk.py
fla/ops/gsa/fused_recurrent.py
fla/ops/gsa/naive.py
fla/ops/hgrn/__init__.py
fla/ops/hgrn/chunk.py
fla/ops/hgrn/fused_recurrent.py
fla/ops/hgrn/naive.py
fla/ops/kda/__init__.py
fla/ops/kda/chunk.py
fla/ops/kda/chunk_bwd.py
fla/ops/kda/chunk_fwd.py
fla/ops/kda/chunk_intra.py
fla/ops/kda/chunk_intra_token_parallel.py
fla/ops/kda/fused_recurrent.py
fla/ops/kda/gate.py
fla/ops/kda/naive.py
fla/ops/kda/wy_fast.py
fla/ops/lightning_attn/__init__.py
fla/ops/lightning_attn/chunk.py
fla/ops/lightning_attn/fused_recurrent.py
fla/ops/linear_attn/__init__.py
fla/ops/linear_attn/chunk.py
fla/ops/linear_attn/fused_chunk.py
fla/ops/linear_attn/fused_recurrent.py
fla/ops/linear_attn/naive.py
fla/ops/linear_attn/utils.py
fla/ops/log_linear_attn/__init__.py
fla/ops/log_linear_attn/chunk.py
fla/ops/log_linear_attn/naive.py
fla/ops/mesa_net/__init__.py
fla/ops/mesa_net/chunk.py
fla/ops/mesa_net/chunk_cg_solver_bwd.py
fla/ops/mesa_net/chunk_cg_solver_fwd.py
fla/ops/mesa_net/chunk_h_fwd.py
fla/ops/mesa_net/chunk_h_kk_intra_bwd.py
fla/ops/mesa_net/chunk_h_kv_intra_bwd.py
fla/ops/mesa_net/chunk_h_kv_intra_bwd_separate.py
fla/ops/mesa_net/decoding_one_step.py
fla/ops/mesa_net/naive.py
fla/ops/nsa/__init__.py
fla/ops/nsa/compression.py
fla/ops/nsa/naive.py
fla/ops/nsa/parallel.py
fla/ops/nsa/utils.py
fla/ops/path_attn/__init__.py
fla/ops/path_attn/cumprod_householder_bwd.py
fla/ops/path_attn/cumprod_householder_fwd.py
fla/ops/path_attn/intra_chunk_preprocess_bwd.py
fla/ops/path_attn/intra_chunk_preprocess_bwd_prepare.py
fla/ops/path_attn/intra_chunk_preprocess_fwd.py
fla/ops/path_attn/naive.py
fla/ops/path_attn/parallel.py
fla/ops/path_attn/parallel_path_bwd_inter_dkv.py
fla/ops/path_attn/parallel_path_bwd_inter_dqh.py
fla/ops/path_attn/parallel_path_bwd_intra.py
fla/ops/path_attn/parallel_path_fwd.py
fla/ops/path_attn/prepare_k_cache.py
fla/ops/path_attn/transform_q.py
fla/ops/rebased/__init__.py
fla/ops/rebased/naive.py
fla/ops/rebased/parallel.py
fla/ops/retention/__init__.py
fla/ops/retention/chunk.py
fla/ops/retention/fused_chunk.py
fla/ops/retention/fused_recurrent.py
fla/ops/retention/naive.py
fla/ops/retention/parallel.py
fla/ops/rwkv4/__init__.py
fla/ops/rwkv4/fused_recurrent.py
fla/ops/rwkv6/__init__.py
fla/ops/rwkv6/chunk.py
fla/ops/rwkv6/chunk_naive.py
fla/ops/rwkv6/fused_recurrent.py
fla/ops/rwkv6/recurrent_naive.py
fla/ops/rwkv7/__init__.py
fla/ops/rwkv7/channel_mixing.py
fla/ops/rwkv7/chunk.py
fla/ops/rwkv7/fused_addcmul.py
fla/ops/rwkv7/fused_k_update.py
fla/ops/rwkv7/fused_recurrent.py
fla/ops/rwkv7/gate_output_correction.py
fla/ops/simple_gla/__init__.py
fla/ops/simple_gla/chunk.py
fla/ops/simple_gla/fused_chunk.py
fla/ops/simple_gla/fused_recurrent.py
fla/ops/simple_gla/naive.py
fla/ops/simple_gla/parallel.py
fla/ops/titans/__init__.py
fla/ops/titans/log_impl.py
fla/ops/titans/naive.py
fla/ops/ttt/__init__.py
fla/ops/ttt/chunk.py
fla/ops/ttt/fused_chunk.py
fla/ops/ttt/naive.py
fla/ops/utils/__init__.py
fla/ops/utils/constant.py
fla/ops/utils/cumsum.py
fla/ops/utils/index.py
fla/ops/utils/logcumsumexp.py
fla/ops/utils/logsumexp.py
fla/ops/utils/matmul.py
fla/ops/utils/op.py
fla/ops/utils/pack.py
fla/ops/utils/pooling.py
fla/ops/utils/softmax.py
fla/ops/utils/softplus.py
fla/ops/utils/solve_tril.py
fla_core.egg-info/PKG-INFO
fla_core.egg-info/SOURCES.txt
fla_core.egg-info/dependency_links.txt
fla_core.egg-info/requires.txt
fla_core.egg-info/top_level.txt