SYMBOL INDEX (144 symbols across 17 files) FILE: finetune_moss.py class SFTDataset (line 25) | class SFTDataset(Dataset): method __init__ (line 26) | def __init__(self, data_dir, tokenizer, data_type='train'): method load_data (line 40) | def load_data(self): method __len__ (line 97) | def __len__(self): method __getitem__ (line 100) | def __getitem__(self, index): method collate_fn (line 113) | def collate_fn(self, batch): class SFTMetric (line 127) | class SFTMetric: method __init__ (line 128) | def __init__(self, device): method __call__ (line 135) | def __call__(self, logits, labels, loss): method update (line 138) | def update(self, logits, labels, loss): method get_metric (line 147) | def get_metric(self, reset=True): function train (line 163) | def train(args): FILE: models/configuration_moss.py class MossConfig (line 10) | class MossConfig(PretrainedConfig): method __init__ (line 75) | def __init__( FILE: models/custom_autotune.py class Autotuner (line 14) | class Autotuner(triton.KernelInterface): method __init__ (line 15) | def __init__(self, fn, arg_names, configs, key, reset_to_zero, prune_c... method _bench (line 51) | def _bench(self, *args, config, **meta): method run (line 75) | def run(self, *args, **kwargs): method prune_configs (line 104) | def prune_configs(self, kwargs): method warmup (line 121) | def warmup(self, *args, **kwargs): function autotune (line 134) | def autotune(configs, key, prune_configs_by=None, reset_to_zero=None, ne... FILE: models/modeling_moss.py function create_sinusoidal_positions (line 40) | def create_sinusoidal_positions(num_pos: int, dim: int) -> torch.Tensor: function rotate_every_two (line 47) | def rotate_every_two(x: torch.Tensor) -> torch.Tensor: function apply_rotary_pos_emb (line 55) | def apply_rotary_pos_emb(tensor: torch.Tensor, sin: torch.Tensor, cos: t... class MossAttention (line 61) | class MossAttention(nn.Module): method __init__ (line 62) | def __init__(self, config): method _split_heads (line 92) | def _split_heads(self, x, n_head, dim_head, mp_num): method _merge_heads (line 97) | def _merge_heads(self, tensor, num_attention_heads, attn_head_size): method _attn (line 110) | def _attn( method forward (line 151) | def forward( class MossMLP (line 230) | class MossMLP(nn.Module): method __init__ (line 231) | def __init__(self, intermediate_size, config): # in MLP: intermediate... method forward (line 241) | def forward(self, hidden_states: Optional[torch.FloatTensor]) -> torch... class MossBlock (line 250) | class MossBlock(nn.Module): method __init__ (line 251) | def __init__(self, config): method forward (line 258) | def forward( class MossPreTrainedModel (line 293) | class MossPreTrainedModel(PreTrainedModel): method __init__ (line 304) | def __init__(self, *inputs, **kwargs): method _init_weights (line 307) | def _init_weights(self, module): method _set_gradient_checkpointing (line 323) | def _set_gradient_checkpointing(self, module, value=False): class MossModel (line 393) | class MossModel(MossPreTrainedModel): method __init__ (line 394) | def __init__(self, config): method get_input_embeddings (line 410) | def get_input_embeddings(self): method set_input_embeddings (line 413) | def set_input_embeddings(self, new_embeddings): method forward (line 422) | def forward( class MossForCausalLM (line 586) | class MossForCausalLM(MossPreTrainedModel): method __init__ (line 589) | def __init__(self, config): method get_output_embeddings (line 616) | def get_output_embeddings(self): method set_output_embeddings (line 619) | def set_output_embeddings(self, new_embeddings): method prepare_inputs_for_generation (line 622) | def prepare_inputs_for_generation(self, input_ids, past_key_values=Non... method forward (line 655) | def forward( method _reorder_cache (line 722) | def _reorder_cache( method quantize (line 735) | def quantize(self, wbits, groupsize): FILE: models/quantization.py function find_layers (line 11) | def find_layers(module, layers=[nn.Conv2d, nn.Linear], name=''): function matmul_248_kernel (line 57) | def matmul_248_kernel(a_ptr, b_ptr, c_ptr, function trans_matmul_248_kernel (line 168) | def trans_matmul_248_kernel(a_ptr, b_ptr, c_ptr, function matmul248 (line 246) | def matmul248(input, qweight, scales, qzeros, g_idx, bits, maxq): function transpose_matmul248 (line 260) | def transpose_matmul248(input, qweight, scales, qzeros, g_idx, bits, maxq): class QuantLinearFunction (line 275) | class QuantLinearFunction(torch.autograd.Function): method forward (line 278) | def forward(ctx, input, qweight, scales, qzeros, g_idx, bits, maxq): method backward (line 286) | def backward(ctx, grad_output): class QuantLinear (line 295) | class QuantLinear(nn.Module): method __init__ (line 296) | def __init__(self, bits, groupsize, infeatures, outfeatures, bias): method pack (line 315) | def pack(self, linear, scales, zeros, g_idx=None): method forward (line 365) | def forward(self, x): function make_quant (line 372) | def make_quant(module, names, bits, groupsize, name=''): function quantize_with_gptq (line 385) | def quantize_with_gptq(model, wbits, groupsize): FILE: models/tokenization_moss.py function bytes_to_unicode (line 62) | def bytes_to_unicode(): function get_pairs (line 86) | def get_pairs(word): class MossTokenizer (line 100) | class MossTokenizer(PreTrainedTokenizer): method __init__ (line 144) | def __init__( method vocab_size (line 190) | def vocab_size(self): method get_vocab (line 193) | def get_vocab(self): method bpe (line 196) | def bpe(self, token): method build_inputs_with_special_tokens (line 238) | def build_inputs_with_special_tokens(self, token_ids_0, token_ids_1=No... method _tokenize (line 251) | def _tokenize(self, text): method _convert_token_to_id (line 261) | def _convert_token_to_id(self, token): method _convert_id_to_token (line 265) | def _convert_id_to_token(self, index): method convert_tokens_to_string (line 269) | def convert_tokens_to_string(self, tokens): method save_vocabulary (line 275) | def save_vocabulary(self, save_directory: str, filename_prefix: Option... method prepare_for_tokenization (line 304) | def prepare_for_tokenization(self, text, is_split_into_words=False, **... method decode (line 310) | def decode( method truncate (line 354) | def truncate(self, completion, truncate_before_pattern): FILE: models_jittor/generation.py function generate (line 3) | def generate(moss, input_str, tokenizer, method, **kwargs): function greedy_search (line 25) | def greedy_search(model, input_str, tokenizer, max_gen_len, function sample (line 76) | def sample(model, input_str, tokenizer, max_gen_len, temperature, top_p,... function sample_top_k (line 138) | def sample_top_k(scores, top_k): function sample_top_p (line 146) | def sample_top_p(scores, top_p): FILE: models_jittor/load.py function load_from_torch_shard_ckpt (line 9) | def load_from_torch_shard_ckpt(model, ckpt_dir): function load_from_map (line 29) | def load_from_map(model: jt.Module, ckpt_dir, file_weight_map): function check_state_dict (line 48) | def check_state_dict(model: jt.Module, ckpt_dir, file_weight_map): FILE: models_jittor/model.py class MossAttention (line 12) | class MossAttention(Module): method __init__ (line 13) | def __init__(self, config): method _split_heads (line 44) | def _split_heads(self, x, n_head, dim_head, mp_num): method _merge_heads (line 49) | def _merge_heads(self, tensor, num_attention_heads, attn_head_size): method _attn (line 62) | def _attn( method execute (line 104) | def execute( class MossMLP (line 178) | class MossMLP(Module): method __init__ (line 179) | def __init__(self, intermediate_size, config): method execute (line 190) | def execute(self, hidden_states: Optional[jt.Var]) -> jt.Var: class MossBlock (line 198) | class MossBlock(Module): method __init__ (line 199) | def __init__(self, config): method execute (line 207) | def execute( class MossModel (line 238) | class MossModel(Module): method __init__ (line 239) | def __init__(self, config): method execute (line 255) | def execute( class MossForCausalLM (line 347) | class MossForCausalLM(Module): method __init__ (line 349) | def __init__(self, config): method execute (line 358) | def execute( FILE: models_jittor/utils.py class NewGELUActivation (line 6) | class NewGELUActivation(jt.Module): method execute (line 8) | def execute(self, input): function fixed_pos_embedding (line 16) | def fixed_pos_embedding(x, seq_dim=1, seq_len=None): function rotate_every_two (line 28) | def rotate_every_two(x): function duplicate_interleave (line 34) | def duplicate_interleave(m): function apply_rotary_pos_emb (line 45) | def apply_rotary_pos_emb(x, sincos, offset=0): function _init_weights (line 50) | def _init_weights(module, config): function _convert_head_mask_to_5d (line 65) | def _convert_head_mask_to_5d(head_mask, num_hidden_layers, dtype): function get_head_mask (line 76) | def get_head_mask( FILE: moss_api_demo.py function create_item (line 72) | async def create_item(request: Request): FILE: moss_cli_demo.py function clear (line 50) | def clear(): function main (line 53) | def main(): FILE: moss_cli_demo_jittor.py function clear (line 46) | def clear(): function main (line 49) | def main(): FILE: moss_inference.py class Inference (line 44) | class Inference: method __init__ (line 45) | def __init__( method Init_Model_Parallelism (line 87) | def Init_Model_Parallelism(self, raw_model_dir: str, device_map: Union... method preprocess (line 127) | def preprocess(self, raw_text: str) -> Tuple[torch.Tensor, torch.Tensor]: method forward (line 144) | def forward( method postprocess_remove_prefix (line 181) | def postprocess_remove_prefix(self, preds_i: str) -> str: method streaming_topk_search (line 193) | def streaming_topk_search( method top_k_top_p_filtering (line 291) | def top_k_top_p_filtering(self, logits, top_k, top_p, filter_value=-fl... method infer_ (line 315) | def infer_( method __call__ (line 342) | def __call__(self, input): FILE: moss_web_demo_gradio.py function postprocess (line 68) | def postprocess(self, y): function parse_text (line 82) | def parse_text(text): function predict (line 115) | def predict(input, chatbot, max_length, top_p, temperature, history): function reset_user_input (line 146) | def reset_user_input(): function reset_state (line 150) | def reset_state(): FILE: moss_web_demo_streamlit.py function load_model (line 47) | def load_model(): function generate_answer (line 92) | def generate_answer(): function clear_history (line 126) | def clear_history(): FILE: utils.py class StopWordsCriteria (line 5) | class StopWordsCriteria(StoppingCriteria): method __init__ (line 7) | def __init__(self, stop_indices: list): method __call__ (line 10) | def __call__(self, input_ids: torch.LongTensor, scores: torch.FloatTen...