src/main/java/com/github/llmjava/cohere4j/CohereApi.java (28 additions, 0 deletions)
@@ -3,9 +3,11 @@
import com.github.llmjava.cohere4j.request.ClassifyRequest;
import com.github.llmjava.cohere4j.request.EmbedRequest;
import com.github.llmjava.cohere4j.request.GenerateRequest;
import com.github.llmjava.cohere4j.request.TokenizeRequest;
import com.github.llmjava.cohere4j.response.ClassifyResponse;
import com.github.llmjava.cohere4j.response.EmbedResponse;
import com.github.llmjava.cohere4j.response.GenerateResponse;
import com.github.llmjava.cohere4j.response.TokenizeResponse;
import retrofit2.Call;
import retrofit2.http.Body;
import retrofit2.http.Headers;
@@ -14,24 +16,50 @@

public interface CohereApi {

/**
* This endpoint generates realistic text conditioned on a given input.
*/
@POST("/v1/generate")
@Headers({"accept: application/json", "content-type: application/json"})
Call<GenerateResponse>
generate(@Body GenerateRequest request);

/**
* This endpoint generates realistic text conditioned on a given input.
*/
@Streaming
@POST("/v1/generate")
@Headers({"accept: application/stream+json", "content-type: application/json"})
Call<String>
generateStream(@Body GenerateRequest request);

/**
* This endpoint returns text embeddings. An embedding is a list of floating point numbers that captures semantic information about the text that it represents.
*
* Embeddings can be used to create text classifiers as well as empower semantic search. To learn more about embeddings, see the embedding page.
*
* If you want to learn more about how to use the embedding model, have a look at the Semantic Search Guide.
*/
@POST("/v1/embed")
@Headers({"accept: application/json", "content-type: application/json"})
Call<EmbedResponse>
embed(@Body EmbedRequest request);

/**
* This endpoint makes a prediction about which label fits the specified text inputs best. To make a prediction, Classify uses the provided examples of text + label pairs as a reference.
*
* Note: Custom Models trained on classification examples don't require the examples parameter to be passed in explicitly.
*/
@POST("/v1/classify")
@Headers({"accept: application/json", "content-type: application/json"})
Call<ClassifyResponse>
classify(@Body ClassifyRequest request);

/**
* This endpoint splits input text into smaller units called tokens using byte-pair encoding (BPE). To learn more about tokenization and byte pair encoding, see the tokens page.
*/
@POST("/v1/tokenize")
@Headers({"accept: application/json", "content-type: application/json"})
Call<TokenizeResponse>
tokenize(@Body TokenizeRequest request);
}
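For orientation, here is a minimal sketch (not part of this PR) of how the CohereApi interface above could be wired up with Retrofit and the new tokenize endpoint called directly. The base URL, the Authorization: Bearer header, the GsonConverterFactory and the class name are assumptions for illustration; in the library this wiring is normally handled by CohereClient.

// Illustrative only: the base URL, auth header and converter below are assumptions,
// not taken from this PR.
import com.github.llmjava.cohere4j.CohereApi;
import com.github.llmjava.cohere4j.request.TokenizeRequest;
import com.github.llmjava.cohere4j.response.TokenizeResponse;
import okhttp3.OkHttpClient;
import retrofit2.Retrofit;
import retrofit2.converter.gson.GsonConverterFactory;

public class RawTokenizeSketch {
    public static void main(String[] args) throws Exception {
        // Attach the API key on every request (assumed bearer-token scheme).
        OkHttpClient http = new OkHttpClient.Builder()
                .addInterceptor(chain -> chain.proceed(chain.request().newBuilder()
                        .addHeader("Authorization", "Bearer " + System.getenv("COHERE_API_KEY"))
                        .build()))
                .build();

        CohereApi api = new Retrofit.Builder()
                .baseUrl("https://api.cohere.ai") // assumed base URL
                .client(http)
                .addConverterFactory(GsonConverterFactory.create())
                .build()
                .create(CohereApi.class);

        TokenizeRequest request = new TokenizeRequest.Builder()
                .withText("tokenize me! :D")
                .withModel("command")
                .build();

        // Synchronous Retrofit call; execute() returns a retrofit2.Response<TokenizeResponse>.
        TokenizeResponse body = api.tokenize(request).execute().body();
        System.out.println(java.util.Arrays.toString(body.getTokens()));
    }
}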
src/main/java/com/github/llmjava/cohere4j/CohereClient.java (10 additions, 0 deletions)
@@ -5,9 +5,11 @@
import com.github.llmjava.cohere4j.request.ClassifyRequest;
import com.github.llmjava.cohere4j.request.EmbedRequest;
import com.github.llmjava.cohere4j.request.GenerateRequest;
import com.github.llmjava.cohere4j.request.TokenizeRequest;
import com.github.llmjava.cohere4j.response.ClassifyResponse;
import com.github.llmjava.cohere4j.response.EmbedResponse;
import com.github.llmjava.cohere4j.response.GenerateResponse;
import com.github.llmjava.cohere4j.response.TokenizeResponse;
import com.github.llmjava.cohere4j.response.streaming.StreamGenerateResponse;
import com.github.llmjava.cohere4j.response.streaming.ResponseConverter;
import com.google.gson.Gson;
@@ -80,6 +82,14 @@ public void classifyAsync(ClassifyRequest request, AsyncCallback<ClassifyResponse> callback) {
execute(api.classify(request), callback);
}

public TokenizeResponse tokenize(TokenizeRequest request) {
return execute(api.tokenize(request));
}

public void tokenizeAsync(TokenizeRequest request, AsyncCallback<TokenizeResponse> callback) {
execute(api.tokenize(request), callback);
}

private <T> T execute(Call<T> action) {
try {
Response<T> response = action.execute();
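The snippet above cuts off before the asynchronous overload of execute that tokenizeAsync (and the other *Async methods) delegate to. A plausible sketch of that overload, assuming AsyncCallback exposes onSuccess/onFailure as the examples further down use it; the actual implementation in CohereClient may differ.

private <T> void execute(Call<T> action, AsyncCallback<T> callback) {
    // Retrofit's enqueue() runs the HTTP call on a background thread and
    // reports back through this anonymous Callback.
    action.enqueue(new retrofit2.Callback<T>() {
        @Override
        public void onResponse(Call<T> call, Response<T> response) {
            if (response.isSuccessful()) {
                callback.onSuccess(response.body());
            } else {
                // Hypothetical error handling; the library may wrap errors differently.
                callback.onFailure(new RuntimeException("HTTP " + response.code()));
            }
        }

        @Override
        public void onFailure(Call<T> call, Throwable throwable) {
            callback.onFailure(throwable);
        }
    });
}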
src/main/java/com/github/llmjava/cohere4j/request/TokenizeRequest.java (new file, 38 additions)
@@ -0,0 +1,38 @@
package com.github.llmjava.cohere4j.request;

public class TokenizeRequest {
/**
* The string to be tokenized; the minimum text length is 1 character and the maximum text length is 65536 characters.
*/
private String text;
/**
* An optional parameter to provide the model name. This will ensure that the tokenization uses the tokenizer used by that model.
*/
private String model;


TokenizeRequest(Builder builder) {
this.text = builder.text;
this.model = builder.model;
}

public static class Builder {

private String text;
private String model;

public Builder withText(String text) {
this.text = text;
return this;
}

public Builder withModel(String model) {
this.model = model;
return this;
}

public TokenizeRequest build() {
return new TokenizeRequest(this);
}
}
}
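CohereClient imports Gson, so the request presumably goes over the wire as plain Gson-serialized JSON, with the private fields above mapping one-to-one onto the /v1/tokenize body. A quick sketch of the payload under default Gson settings (the class name is illustrative):

import com.github.llmjava.cohere4j.request.TokenizeRequest;
import com.google.gson.Gson;

public class TokenizeRequestJsonSketch {
    public static void main(String[] args) {
        TokenizeRequest request = new TokenizeRequest.Builder()
                .withText("tokenize me! :D")
                .withModel("command")
                .build();
        // Prints: {"text":"tokenize me! :D","model":"command"}
        // (By default Gson serializes the private fields under their declared names.)
        System.out.println(new Gson().toJson(request));
    }
}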
src/main/java/com/github/llmjava/cohere4j/response/TokenizeResponse.java (new file, 23 additions)
@@ -0,0 +1,23 @@
package com.github.llmjava.cohere4j.response;

public class TokenizeResponse {
private Integer[] tokens;
private String[] token_strings;
private Meta meta;

public Integer[] getTokens() {
return tokens;
}

public Integer getToken(int index) {
return tokens[index];
}

public String[] getTokenStrings() {
return token_strings;
}

public String getTokenString(int index) {
return token_strings[index];
}
}
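The tokens and token_strings arrays appear to be parallel (one numeric ID per BPE piece), so zipping them gives a readable view of the segmentation. A small helper sketch, assuming a TokenizeResponse obtained as in the TokenizationExample at the end of this diff:

// Illustrative helper, not part of the PR: print each token ID next to its text piece.
static void printTokens(TokenizeResponse response) {
    Integer[] ids = response.getTokens();
    String[] pieces = response.getTokenStrings();
    for (int i = 0; i < ids.length; i++) {
        System.out.println(ids[i] + " -> \"" + pieces[i] + "\"");
    }
}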
src/test/java/com/github/llmjava/cohere4j/ClassificationExample.java
@@ -2,9 +2,7 @@

import com.github.llmjava.cohere4j.callback.AsyncCallback;
import com.github.llmjava.cohere4j.request.ClassifyRequest;
import com.github.llmjava.cohere4j.request.EmbedRequest;
import com.github.llmjava.cohere4j.response.ClassifyResponse;
import com.github.llmjava.cohere4j.response.EmbedResponse;
import org.apache.commons.configuration2.ex.ConfigurationException;

public class ClassificationExample {
@@ -39,9 +37,9 @@ public static void main(String[] args) throws ConfigurationException {
@Override
public void onSuccess(ClassifyResponse response) {
System.out.println("--- Async example - onSuccess");
System.out.println("Input: " + response.getClassification(0).getInput());
System.out.println("Prediction: " + response.getClassification(0).getPrediction());
System.out.println("Confidence: " + response.getClassification(0).getConfidence()); }
System.out.println("Input: " + response.getClassification(1).getInput());
System.out.println("Prediction: " + response.getClassification(1).getPrediction());
System.out.println("Confidence: " + response.getClassification(1).getConfidence()); }

@Override
public void onFailure(Throwable throwable) {
@@ -20,7 +20,7 @@ public static void main(String[] args) throws ConfigurationException {
.build();

System.out.println("--- Sync example");
System.out.println(client.generate(request1).getTexts());
System.out.println(client.generate(request1).getTexts().get(0));
client.generateAsync(request1, new AsyncCallback<GenerateResponse>() {
@Override
public void onSuccess(GenerateResponse completion) {
src/test/java/com/github/llmjava/cohere4j/TokenizationExample.java (new file, 39 additions)
@@ -0,0 +1,39 @@
package com.github.llmjava.cohere4j;

import com.github.llmjava.cohere4j.callback.AsyncCallback;
import com.github.llmjava.cohere4j.request.TokenizeRequest;
import com.github.llmjava.cohere4j.response.TokenizeResponse;
import org.apache.commons.configuration2.ex.ConfigurationException;

public class TokenizationExample {

public static void main(String[] args) throws ConfigurationException {
CohereConfig config = CohereConfig.fromProperties("cohere.properties");
CohereClient client = new CohereClient.Builder().withConfig(config).build();

TokenizeRequest request = new TokenizeRequest.Builder()
.withText("tokenize me! :D")
.withModel("command")
.build();

System.out.println("--- Sync example");
TokenizeResponse response = client.tokenize(request);
System.out.println("Token: " + response.getTokenString(0));
System.out.println("Token ID: " + response.getToken(0));

client.tokenizeAsync(request, new AsyncCallback<TokenizeResponse>() {
@Override
public void onSuccess(TokenizeResponse response) {
System.out.println("--- Async example - onSuccess");
System.out.println("Token: " + response.getTokenString(0));
System.out.println("Token ID: " + response.getToken(0));
}

@Override
public void onFailure(Throwable throwable) {
System.out.println("--- Async example - onFailure");
throwable.printStackTrace();
}
});
}
}