24 lines
821 B
Python
Raw Permalink Normal View History

# Copyright (c) Sebastian Raschka under Apache License 2.0 (see LICENSE.txt).
# Source for "Build a Large Language Model From Scratch"
# - https://www.manning.com/books/build-a-large-language-model-from-scratch
# Code: https://github.com/rasbt/LLMs-from-scratch
class KVCache:
def __init__(self, n_layers, batch_size):
self.cache = [
[None for _ in range(batch_size)] for _ in range(n_layers)
]
def get(self, layer_idx, batch_idx):
return self.cache[layer_idx][batch_idx]
def update(self, layer_idx, batch_idx, value):
self.cache[layer_idx][batch_idx] = value
def get_layer(self, layer_idx):
return self.cache[layer_idx]
def reset(self):
for layer in self.cache:
for i in range(len(layer)):
layer[i] = None