Skip to content

Commit 85de4ca

Browse files
refactor
1 parent ce3c810 commit 85de4ca

File tree

5 files changed

+2
-173
lines changed

5 files changed

+2
-173
lines changed

models/batch_generation.py

Lines changed: 0 additions & 62 deletions
This file was deleted.

models/bench.py

Lines changed: 0 additions & 57 deletions
This file was deleted.

models/bench.sh

Lines changed: 0 additions & 10 deletions
This file was deleted.

models/generation.py

Lines changed: 0 additions & 42 deletions
This file was deleted.

models/llama.py

Lines changed: 2 additions & 2 deletions
Unified diff (old line 3 / new line 3 onward):
@@ -3,9 +3,9 @@
 from transformers.models.llama.modeling_llama import LlamaDecoderLayer
 import torch.nn.functional as F
 import gc
-from utils import apply_rotary_pos_emb, layer_norm, topp_temperature_decode
+from .utils import apply_rotary_pos_emb, layer_norm, topp_temperature_decode
 import flashinfer
-from attnserver import LSHSparseAttnServer, AttnServer
+from .attnserver import LSHSparseAttnServer, AttnServer
 class LLMLayer:
     def __init__(self, layer_idx) -> None:
 

0 commit comments

Comments
 (0)