File tree Expand file tree Collapse file tree 2 files changed +2
-2
lines changed Expand file tree Collapse file tree 2 files changed +2
-2
lines changed Original file line number Diff line number Diff line change @@ -632,7 +632,7 @@ static bool llama_eval_internal(
632
632
auto & mem_at_token1 = lctx.mem_at_token1 ;
633
633
634
634
// TODO: fix this hardcoded size
635
- static size_t buf_size = size_t (n_ctx)*1024 *1024 ;
635
+ static size_t buf_size = size_t (n_ctx)*size_t (N)* 128 *1024 ;
636
636
static void * buf = malloc (buf_size);
637
637
638
638
const size_t C0 = mem_at_token0; // ~base
Original file line number Diff line number Diff line change @@ -219,7 +219,7 @@ int main(int argc, char ** argv) {
219
219
// (fill in mem_at_token0 and mem_at_token1)
220
220
// TODO: better way to do that
221
221
// TODO(Green-Sky): move to internal and detect first time usage
222
- {
222
+ if (!params. perplexity ) { // perplexity does not grow over time
223
223
// we make 2 evals, of batchsize to take 2 measurements, to determine base and growth
224
224
std::vector<llama_token> tmp (params.n_batch *2 , 2 );
225
225
tmp[0 ] = llama_token_bos ();
You can’t perform that action at this time.
0 commit comments