Skip to content

Commit bb093eb

Browse files
authored
Merge pull request #4 from ggerganov/server-parallel
server-parallel : add "--reverse-prompt" + compiler warning fixes
2 parents: afc09db + 5ab6c21 — commit bb093eb

File tree

1 file changed

+26
-14
lines changed

1 file changed

+26
-14
lines changed

examples/server-parallel/server.cpp

Lines changed: 26 additions & 14 deletions
Original file line number | Diff line number | Diff line change
@@ -1,13 +1,15 @@
1-
#include <chrono>
1+
#include "frontend.h"
2+
#include "common.h"
3+
#include "llama.h"
4+
25
#include "../server/httplib.h"
36
#include "../server/json.hpp"
7+
48
#include <iostream>
59
#include <sstream>
610
#include <thread>
711
#include <vector>
8-
#include "frontend.h"
9-
#include "common.h"
10-
#include "llama.h"
12+
#include <chrono>
1113

1214
using namespace httplib;
1315
using namespace std;
@@ -241,9 +243,7 @@ struct server_parallel_context {
241243
string prompt = data.value("prompt", "");
242244
for (llama_client_slot & slot : slots)
243245
{
244-
if (
245-
slot_id == -1 && slot.available() ||
246-
slot.id == slot_id)
246+
if ((slot_id == -1 && slot.available()) || slot.id == slot_id)
247247
{
248248
slot.start(prompt, temperature);
249249
LOG_TEE("slot %i is processing\n", slot.id);
@@ -429,8 +429,6 @@ struct server_parallel_context {
429429
slot.generated_text += token_str;
430430
slot.sampled = id;
431431

432-
size_t pos = 0;
433-
434432
size_t stop_pos =
435433
findStoppingStrings(slot.generated_text, token_str.size(), STOP_FULL);
436434

@@ -740,20 +738,34 @@ static void server_params_parse(int argc, char **argv, server_params &sparams,
740738
else if (arg == "--numa")
741739
{
742740
params.numa = true;
743-
} else if (arg == "-cb" || arg == "--cont-batching") {
741+
} else if (arg == "-cb" || arg == "--cont-batching")
742+
{
744743
params.cont_batching = true;
745-
} else if (arg == "-np" || arg == "--parallel") {
746-
if (++i >= argc) {
744+
}
745+
else if (arg == "-np" || arg == "--parallel")
746+
{
747+
if (++i >= argc)
748+
{
747749
invalid_param = true;
748750
break;
749751
}
750752
params.n_parallel = std::stoi(argv[i]);
751-
} else if (arg == "-n" || arg == "--n-predict") {
752-
if (++i >= argc) {
753+
} else if (arg == "-n" || arg == "--n-predict")
754+
{
755+
if (++i >= argc)
756+
{
753757
invalid_param = true;
754758
break;
755759
}
756760
params.n_predict = std::stoi(argv[i]);
761+
} else if (arg == "-r" || arg == "--reverse-prompt")
762+
{
763+
if (++i >= argc)
764+
{
765+
invalid_param = true;
766+
break;
767+
}
768+
params.antiprompt.push_back(argv[i]);
757769
}
758770
else
759771
{

0 commit comments

Comments
 (0)