Contents:
Seshu
Seshu.push_to_hub()
Seshu.tokenize()
Seshu.train_lora()
MambaTrainer
MambaTrainer.compute_loss()
Seshu.model_merge_eval()
Seshu.pretrain()
compute_loss()
create_JSON()
evaluation()
get_checkpoint_model()
get_data()
load_data()
load_json()
make_config()
model_merge()
print_trainable_parameters()
MambaConfig
MambaConfig.model_type
MambaBlock
MambaBlock.forward()
MambaBlock.selective_scan()
MambaBlock.ssm()
MambaForCausalLM
MambaForCausalLM.forward()
MambaForCausalLM.get_decoder()
MambaForCausalLM.get_input_embeddings()
MambaForCausalLM.get_output_embeddings()
MambaForCausalLM.prepare_inputs_for_generation()
MambaForCausalLM.set_decoder()
MambaForCausalLM.set_input_embeddings()
MambaForCausalLM.set_output_embeddings()
MambaModel
MambaModel.forward()
MambaModel.get_input_embeddings()
MambaModel.set_input_embeddings()
MambaPreTrainedModel
MambaPreTrainedModel.base_model_prefix
MambaPreTrainedModel.config_class
MambaPreTrainedModel.supports_gradient_checkpointing
MambaRMSNorm
MambaRMSNorm.forward()
get_client_details()
verify_user_with_org()
load_model()
load_model_pretrained()
load_model_with_LoRA()
load_tokenizer()
split_data()