We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent e066071 commit 46f6fd2 — Copy full SHA for 46f6fd2
tools/server/server-context.cpp
@@ -35,10 +35,10 @@ constexpr int HTTP_POLLING_SECONDS = 1;
35
// state diagram: https://github.com/ggml-org/llama.cpp/pull/9283
36
enum slot_state {
37
SLOT_STATE_IDLE,
38
- SLOT_STATE_STARTED, // after assigning a task
+ SLOT_STATE_WAIT_OTHER, // after assigning a task, but waiting for parent slot to process prompt
39
+ SLOT_STATE_STARTED, // after assigning a task and about to process prompt
40
SLOT_STATE_PROCESSING_PROMPT,
41
SLOT_STATE_DONE_PROMPT,
- SLOT_STATE_WAIT_OTHER, // prompt processed, but waiting for other slots to copy the state
42
SLOT_STATE_GENERATING,
43
};
44
0 commit comments