SYMBOL INDEX (24 symbols across 7 files) FILE: examples/run_streaming_llama.py function greedy_generate (line 19) | def greedy_generate(model, tokenizer, input_ids, past_key_values, max_ge... function streaming_inference (line 61) | def streaming_inference(model, tokenizer, prompts, kv_cache=None, max_ge... function main (line 78) | def main(args): FILE: streaming_llm/enable_streaming_llm.py function enable_streaming_llm (line 4) | def enable_streaming_llm(model, start_size, recent_size): FILE: streaming_llm/kv_cache.py function slice2d (line 4) | def slice2d(x, start, end): function slice3d (line 8) | def slice3d(x, start, end): function slice1d (line 12) | def slice1d(x, start, end): class StartRecentKVCache (line 23) | class StartRecentKVCache: method __init__ (line 24) | def __init__( method __call__ (line 40) | def __call__(self, past_key_values): method evict_for_space (line 66) | def evict_for_space(self, past_key_values, num_coming): method evict_range (line 96) | def evict_range(self, past_key_values, start, end): FILE: streaming_llm/pos_shift/modify_falcon.py function falcon_pos_shift_attention_forward (line 19) | def falcon_pos_shift_attention_forward( function enable_falcon_pos_shift_attention (line 152) | def enable_falcon_pos_shift_attention(model): FILE: streaming_llm/pos_shift/modify_gpt_neox.py function apply_rotary_pos_emb_single (line 20) | def apply_rotary_pos_emb_single(x, cos, sin, position_ids): function gpt_neox_pos_shift_attention_forward (line 29) | def gpt_neox_pos_shift_attention_forward( function enable_gpt_neox_pos_shift_attention (line 99) | def enable_gpt_neox_pos_shift_attention(model): FILE: streaming_llm/pos_shift/modify_llama.py function apply_rotary_pos_emb_single (line 21) | def apply_rotary_pos_emb_single(x, cos, sin, position_ids): function llama_pos_shift_attention_forward (line 31) | def llama_pos_shift_attention_forward( function enable_llama_pos_shift_attention (line 164) | def enable_llama_pos_shift_attention(model): FILE: streaming_llm/utils.py function parse_args (line 14) | def parse_args(): function load (line 51) | def load(model_name_or_path): function download_url (line 75) | def download_url(url: str, folder="folder"): function load_jsonl (line 105) | def load_jsonl(