Add interactive total token count label, codebase refactoring

This commit is contained in:
Carl-Robert Linnupuu 2023-11-14 13:27:15 +02:00
parent d8e5e18998
commit ec3120a5e6
31 changed files with 804 additions and 322 deletions

View file

@ -6,6 +6,7 @@ import com.knuddels.jtokkit.Encodings;
import com.knuddels.jtokkit.api.Encoding;
import com.knuddels.jtokkit.api.EncodingRegistry;
import com.knuddels.jtokkit.api.EncodingType;
import ee.carlrobert.codegpt.conversations.Conversation;
import ee.carlrobert.llm.client.openai.completion.chat.request.OpenAIChatCompletionMessage;
@Service
@ -21,9 +22,23 @@ public final class EncodingManager {
return ApplicationManager.getApplication().getService(EncodingManager.class);
}
/**
 * Counts the tokens of every prompt and response stored in a conversation.
 *
 * @param conversation the conversation to measure; may be {@code null}
 * @return the summed token count of all message prompts and responses, or {@code 0} when
 *     {@code conversation} is {@code null}
 */
public int countConversationTokens(Conversation conversation) {
  // Nothing to count without a conversation.
  if (conversation == null) {
    return 0;
  }

  var messages = conversation.getMessages();
  return messages.stream()
      .mapToInt(entry -> {
        var promptTokens = countTokens(entry.getPrompt());
        var responseTokens = countTokens(entry.getResponse());
        return promptTokens + responseTokens;
      })
      .sum();
}
/**
 * Counts the tokens of a chat completion message by delegating to
 * {@link #countMessageTokens(String, String)} with the message's role and content.
 *
 * @param message the chat completion message to measure
 * @return the token count reported by the role/content overload
 */
public int countMessageTokens(OpenAIChatCompletionMessage message) {
  var role = message.getRole();
  var content = message.getContent();
  return countMessageTokens(role, content);
}
/**
 * Counts the tokens of a single chat message given its role and content.
 *
 * <p>The role and content are concatenated and counted via {@code countTokens}, then a fixed
 * per-message overhead is added.
 *
 * @param role the role of the message author
 * @param content the message body
 * @return the token count of {@code role + content} plus the per-message overhead
 */
public int countMessageTokens(String role, String content) {
  var tokensPerMessage = 4; // every message follows <|start|>{role/name}\n{content}<|end|>\n
  return countTokens(role + content) + tokensPerMessage;
}
public int countTokens(String text) {