microsoft
diff --git a/‎aiservices/google/src/main/java/com/microsoft/semantickernel/aiservices/google/chatcompletion/GeminiChatCompletion.java
+49-1 b/‎aiservices/google/src/main/java/com/microsoft/semantickernel/aiservices/google/chatcompletion/GeminiChatCompletion.java
+49-1
diff --git a/‎aiservices/google/src/main/java/com/microsoft/semantickernel/aiservices/google/chatcompletion/GeminiStreamingChatMessageContent.java
+45 b/‎aiservices/google/src/main/java/com/microsoft/semantickernel/aiservices/google/chatcompletion/GeminiStreamingChatMessageContent.java
+45
diff --git a/‎semantickernel-api/src/main/java/com/microsoft/semantickernel/services/textcompletion/StreamingTextContent.java renamed to ‎aiservices/google/src/main/java/com/microsoft/semantickernel/aiservices/google/textcompletion/GeminiStreamingTextContent.java
+5-4 b/‎semantickernel-api/src/main/java/com/microsoft/semantickernel/services/textcompletion/StreamingTextContent.java renamed to ‎aiservices/google/src/main/java/com/microsoft/semantickernel/aiservices/google/textcompletion/GeminiStreamingTextContent.java
+5-4
diff --git a/‎aiservices/google/src/main/java/com/microsoft/semantickernel/aiservices/google/textcompletion/GeminiTextGenerationService.java
+10-10 b/‎aiservices/google/src/main/java/com/microsoft/semantickernel/aiservices/google/textcompletion/GeminiTextGenerationService.java
+10-10
diff --git a/‎aiservices/huggingface/src/main/java/com/microsoft/semantickernel/aiservices/huggingface/services/HuggingFaceTextGenerationService.java
+1-1 b/‎aiservices/huggingface/src/main/java/com/microsoft/semantickernel/aiservices/huggingface/services/HuggingFaceTextGenerationService.java
+1-1
diff --git a/‎aiservices/openai/src/main/java/com/microsoft/semantickernel/aiservices/openai/chatcompletion/OpenAIChatCompletion.java
+88 b/‎aiservices/openai/src/main/java/com/microsoft/semantickernel/aiservices/openai/chatcompletion/OpenAIChatCompletion.java
+88
diff --git a/‎aiservices/openai/src/main/java/com/microsoft/semantickernel/aiservices/openai/chatcompletion/OpenAIStreamingChatMessageContent.java
+41 b/‎aiservices/openai/src/main/java/com/microsoft/semantickernel/aiservices/openai/chatcompletion/OpenAIStreamingChatMessageContent.java
+41
diff --git a/‎aiservices/openai/src/main/java/com/microsoft/semantickernel/aiservices/openai/textcompletion/OpenAIStreamingTextContent.java
+34 b/‎aiservices/openai/src/main/java/com/microsoft/semantickernel/aiservices/openai/textcompletion/OpenAIStreamingTextContent.java
+34
@@ -16,6 +16,7 @@
 import com.google.protobuf.Value;
 import com.microsoft.semantickernel.Kernel;
 import com.microsoft.semantickernel.aiservices.google.GeminiService;
+import com.microsoft.semantickernel.aiservices.google.GeminiServiceBuilder;
 import com.microsoft.semantickernel.aiservices.google.implementation.MonoConverter;
 import com.microsoft.semantickernel.contextvariables.ContextVariableTypes;
 import com.microsoft.semantickernel.exceptions.AIException;
@@ -36,7 +37,7 @@
 import com.microsoft.semantickernel.services.chatcompletion.ChatCompletionService;
 import com.microsoft.semantickernel.services.chatcompletion.ChatHistory;
 import com.microsoft.semantickernel.services.chatcompletion.ChatMessageContent;
-import com.microsoft.semantickernel.aiservices.google.GeminiServiceBuilder;
+import com.microsoft.semantickernel.services.chatcompletion.StreamingChatContent;
 import java.io.IOException;
 import java.time.OffsetDateTime;
 import java.util.ArrayList;
@@ -75,6 +76,53 @@ public Mono<List<ChatMessageContent<?>>> getChatMessageContentsAsync(String prom
             invocationContext);
     }
 
+    /**
+     * Returns the chat completion for the given chat history as a stream of content items.
+     * <p>
+     * The response is not streamed incrementally: the complete result is requested through
+     * {@code getChatMessageContentsAsync} and every returned message is emitted as one item.
+     * A warning is logged on every call.
+     *
+     * @param chatHistory       the chat history forwarded to the non-streaming call
+     * @param kernel            the kernel forwarded to the non-streaming call, may be null
+     * @param invocationContext the invocation context forwarded to the non-streaming call,
+     *                          may be null
+     * @return a flux emitting one streaming content item per returned chat message
+     */
+    @Override
+    public Flux<StreamingChatContent<?>> getStreamingChatMessageContentsAsync(
+        ChatHistory chatHistory,
+        @Nullable Kernel kernel,
+        @Nullable InvocationContext invocationContext) {
+        warnStreamingUnsupported();
+
+        return getChatMessageContentsAsync(chatHistory, kernel, invocationContext)
+            .flatMapIterable(chatMessageContents -> chatMessageContents)
+            .map(this::toStreamingContent);
+    }
+
+    /**
+     * Returns the chat completion for the given prompt as a stream of content items.
+     * <p>
+     * The response is not streamed incrementally: the complete result is requested through
+     * {@code getChatMessageContentsAsync} and every returned message is emitted as one item.
+     * A warning is logged on every call.
+     *
+     * @param prompt            the prompt forwarded to the non-streaming call
+     * @param kernel            the kernel forwarded to the non-streaming call, may be null
+     * @param invocationContext the invocation context forwarded to the non-streaming call,
+     *                          may be null
+     * @return a flux emitting one streaming content item per returned chat message
+     */
+    @Override
+    public Flux<StreamingChatContent<?>> getStreamingChatMessageContentsAsync(String prompt,
+        @Nullable Kernel kernel, @Nullable InvocationContext invocationContext) {
+        warnStreamingUnsupported();
+
+        return getChatMessageContentsAsync(prompt, kernel, invocationContext)
+            .flatMapIterable(chatMessageContents -> chatMessageContents)
+            .map(this::toStreamingContent);
+    }
+
+    /**
+     * Logs that streaming was requested and that results are returned in one piece instead.
+     */
+    private void warnStreamingUnsupported() {
+        LOGGER.warn("Streaming has been called on GeminiChatCompletion service. "
+            + "This is currently not supported in Gemini. "
+            + "The results will be returned in a non streaming fashion.");
+    }
+
+    /**
+     * Copies a complete chat message into a streaming content item.
+     * <p>
+     * No function calls are carried over (null is passed) and a freshly generated random UUID
+     * is used as the item id.
+     *
+     * @param content the complete chat message to wrap
+     * @return the streaming representation of {@code content}
+     */
+    private StreamingChatContent<?> toStreamingContent(ChatMessageContent<?> content) {
+        // Diamond instead of a raw type so the inner content type stays checked.
+        return new GeminiStreamingChatMessageContent<>(
+            content.getAuthorRole(),
+            content.getContent(),
+            getModelId(),
+            content.getInnerContent(),
+            content.getEncoding(),
+            content.getMetadata(),
+            null,
+            UUID.randomUUID().toString());
+    }
+
     @Override
     public Mono<List<ChatMessageContent<?>>> getChatMessageContentsAsync(ChatHistory chatHistory,
         @Nullable Kernel kernel, @Nullable InvocationContext invocationContext) {
 
@@ -0,0 +1,45 @@
+// Copyright (c) Microsoft. All rights reserved.
+package com.microsoft.semantickernel.aiservices.google.chatcompletion;
+
+import com.microsoft.semantickernel.orchestration.FunctionResultMetadata;
+import com.microsoft.semantickernel.services.chatcompletion.AuthorRole;
+import com.microsoft.semantickernel.services.chatcompletion.StreamingChatContent;
+import java.nio.charset.Charset;
+import java.util.List;
+import javax.annotation.Nullable;
+
+/**
+ * A {@link GeminiChatMessageContent} that also implements {@link StreamingChatContent} by
+ * carrying an identifier alongside the message data.
+ *
+ * @param <T> The type of the inner content.
+ */
+public class GeminiStreamingChatMessageContent<T> extends GeminiChatMessageContent<T> implements
+    StreamingChatContent<T> {
+
+    private final String id;
+
+    /**
+     * Creates a new instance of the {@link GeminiStreamingChatMessageContent} class.
+     * <p>
+     * Every argument except {@code id} is handed unchanged to the
+     * {@link GeminiChatMessageContent} constructor.
+     *
+     * @param authorRole          The author role that generated the content.
+     * @param content             The content.
+     * @param modelId             The model id.
+     * @param innerContent        The inner content.
+     * @param encoding            The encoding.
+     * @param metadata            The metadata.
+     * @param geminiFunctionCalls The function calls.
+     * @param id                  The identifier returned by {@link #getId()}.
+     */
+    public GeminiStreamingChatMessageContent(
+        AuthorRole authorRole,
+        String content,
+        @Nullable String modelId,
+        @Nullable T innerContent,
+        @Nullable Charset encoding,
+        @Nullable FunctionResultMetadata metadata,
+        @Nullable List<GeminiFunctionCall> geminiFunctionCalls,
+        String id) {
+        super(
+            authorRole,
+            content,
+            modelId,
+            innerContent,
+            encoding,
+            metadata,
+            geminiFunctionCalls);
+
+        this.id = id;
+    }
+
+    /**
+     * Returns the identifier supplied at construction time.
+     *
+     * @return the id of this content item
+     */
+    @Override
+    public String getId() {
+        return this.id;
+    }
+}
@@ -1,21 +1,22 @@
 // Copyright (c) Microsoft. All rights reserved.
-package com.microsoft.semantickernel.services.textcompletion;
+package com.microsoft.semantickernel.aiservices.google.textcompletion;
 
-import com.microsoft.semantickernel.services.StreamingKernelContent;
+import com.microsoft.semantickernel.services.StreamingTextContent;
+import com.microsoft.semantickernel.services.textcompletion.TextContent;
 import javax.annotation.Nullable;
 
 /**
  * StreamingTextContent is a wrapper for TextContent that allows for streaming.
  */
-public class StreamingTextContent extends StreamingKernelContent<TextContent> {
+public class GeminiStreamingTextContent extends StreamingTextContent<TextContent> {
 
     /**
      * Initializes a new instance of the {@code StreamingTextContent} class with a provided text
      * content.
      *
      * @param content The text content.
      */
-    public StreamingTextContent(TextContent content) {
+    public GeminiStreamingTextContent(TextContent content) {
         super(content, 0, null, null);
     }
 
 
@@ -7,30 +7,29 @@
 import com.google.cloud.vertexai.generativeai.GenerativeModel;
 import com.microsoft.semantickernel.Kernel;
 import com.microsoft.semantickernel.aiservices.google.GeminiService;
+import com.microsoft.semantickernel.aiservices.google.GeminiServiceBuilder;
 import com.microsoft.semantickernel.aiservices.google.implementation.MonoConverter;
 import com.microsoft.semantickernel.exceptions.AIException;
 import com.microsoft.semantickernel.exceptions.SKCheckedException;
 import com.microsoft.semantickernel.exceptions.SKException;
 import com.microsoft.semantickernel.orchestration.FunctionResultMetadata;
 import com.microsoft.semantickernel.orchestration.PromptExecutionSettings;
-import com.microsoft.semantickernel.aiservices.google.GeminiServiceBuilder;
-import com.microsoft.semantickernel.services.textcompletion.StreamingTextContent;
+import com.microsoft.semantickernel.services.StreamingTextContent;
 import com.microsoft.semantickernel.services.textcompletion.TextContent;
 import com.microsoft.semantickernel.services.textcompletion.TextGenerationService;
-import reactor.core.publisher.Flux;
-import reactor.core.publisher.Mono;
-
-import org.slf4j.Logger;
-import org.slf4j.LoggerFactory;
-
-import javax.annotation.Nullable;
 import java.io.IOException;
 import java.time.OffsetDateTime;
 import java.util.ArrayList;
 import java.util.List;
 import java.util.UUID;
+import javax.annotation.Nullable;
+import org.slf4j.Logger;
+import org.slf4j.LoggerFactory;
+import reactor.core.publisher.Flux;
+import reactor.core.publisher.Mono;
 
 public class GeminiTextGenerationService extends GeminiService implements TextGenerationService {
+
     private static final Logger LOGGER = LoggerFactory.getLogger(GeminiTextGenerationService.class);
 
     public GeminiTextGenerationService(VertexAI client, String modelId) {
@@ -57,7 +56,7 @@ public Flux<StreamingTextContent> getStreamingTextContentsAsync(
         return this
             .internalGetTextAsync(prompt, executionSettings)
             .flatMapMany(it -> Flux.fromStream(it.stream())
-                .map(StreamingTextContent::new));
+                .map(GeminiStreamingTextContent::new));
     }
 
     private Mono<List<TextContent>> internalGetTextAsync(String prompt,
@@ -124,6 +123,7 @@ private GenerativeModel getGenerativeModel(
 
     public static class Builder extends
         GeminiServiceBuilder<GeminiTextGenerationService, GeminiTextGenerationService.Builder> {
+
         @Override
         public GeminiTextGenerationService build() {
             if (this.client == null) {
 
@@ -9,7 +9,7 @@
 import com.microsoft.semantickernel.exceptions.SKException;
 import com.microsoft.semantickernel.orchestration.FunctionResultMetadata;
 import com.microsoft.semantickernel.orchestration.PromptExecutionSettings;
-import com.microsoft.semantickernel.services.textcompletion.StreamingTextContent;
+import com.microsoft.semantickernel.services.StreamingTextContent;
 import com.microsoft.semantickernel.services.textcompletion.TextContent;
 import com.microsoft.semantickernel.services.textcompletion.TextGenerationService;
 import java.util.List;
 
@@ -56,6 +56,7 @@
 import com.microsoft.semantickernel.services.chatcompletion.ChatCompletionService;
 import com.microsoft.semantickernel.services.chatcompletion.ChatHistory;
 import com.microsoft.semantickernel.services.chatcompletion.ChatMessageContent;
+import com.microsoft.semantickernel.services.chatcompletion.StreamingChatContent;
 import com.microsoft.semantickernel.services.chatcompletion.message.ChatMessageContentType;
 import com.microsoft.semantickernel.services.chatcompletion.message.ChatMessageImageContent;
 import com.microsoft.semantickernel.services.openai.OpenAiServiceBuilder;
@@ -64,6 +65,7 @@
 import java.util.Arrays;
 import java.util.Collections;
 import java.util.List;
+import java.util.Locale;
 import java.util.Map;
 import java.util.Objects;
 import java.util.stream.Collectors;
@@ -179,6 +181,92 @@ public Mono<List<ChatMessageContent<?>>> getChatMessageContentsAsync(
             });
     }
 
+    /**
+     * Streams the chat completion for the given chat history.
+     * <p>
+     * Every choice of every streamed completions chunk is emitted as one
+     * {@link OpenAIStreamingChatMessageContent} whose id is the id of the chunk it came from.
+     * When a choice's delta carries no role, {@link AuthorRole#ASSISTANT} is used.
+     *
+     * @param chatHistory       the chat history to send
+     * @param kernel            the kernel whose plugin functions are offered to the model,
+     *                          may be null
+     * @param invocationContext the invocation context, may be null
+     * @return a flux of streamed chat content; it fails with an {@link AIException} when a
+     *         response reports a status code of 400 or above
+     * @throws SKException if the invocation context allows auto invocation of tool calls, or
+     *                     requests a return mode other than {@code NEW_MESSAGES_ONLY}
+     */
+    @Override
+    public Flux<StreamingChatContent<?>> getStreamingChatMessageContentsAsync(
+        ChatHistory chatHistory,
+        @Nullable Kernel kernel,
+        @Nullable InvocationContext invocationContext) {
+        // A context may be configured without any tool call behavior; check before dereferencing.
+        if (invocationContext != null
+            && invocationContext.getToolCallBehavior() != null
+            && invocationContext.getToolCallBehavior().isAutoInvokeAllowed()) {
+            throw new SKException(
+                "Auto invoke is not supported for streaming chat message contents");
+        }
+
+        if (invocationContext != null
+            && invocationContext.returnMode() != InvocationReturnMode.NEW_MESSAGES_ONLY) {
+            throw new SKException(
+                "Streaming chat message contents only supports NEW_MESSAGES_ONLY return mode");
+        }
+
+        List<ChatRequestMessage> chatRequestMessages = getChatRequestMessages(chatHistory);
+
+        ChatMessages messages = new ChatMessages(chatRequestMessages);
+
+        // Collect every function of every plugin registered on the kernel.
+        List<OpenAIFunction> functions = new ArrayList<>();
+        if (kernel != null) {
+            kernel.getPlugins()
+                .forEach(plugin -> plugin.getFunctions().forEach((name, function) -> functions
+                    .add(OpenAIFunction.build(function.getMetadata(), plugin.getName()))));
+        }
+
+        // The hook receives the prepared options and its result supplies the ones actually sent.
+        ChatCompletionsOptions options = executeHook(
+            invocationContext,
+            kernel,
+            new PreChatCompletionEvent(
+                getCompletionsOptions(
+                    this,
+                    messages.allMessages,
+                    functions,
+                    invocationContext)))
+            .getOptions();
+
+        return getClient()
+            .getChatCompletionsStreamWithResponse(
+                getDeploymentName(),
+                options,
+                OpenAIRequestSettings.getRequestOptions())
+            .flatMap(completionsResult -> {
+                if (completionsResult.getStatusCode() >= 400) {
+                    return Mono.error(new AIException(ErrorCodes.SERVICE_ERROR,
+                        "Request failed: " + completionsResult.getStatusCode()));
+                }
+
+                return Mono.just(completionsResult.getValue());
+            })
+            .flatMap(completions -> {
+                return Flux.fromIterable(completions.getChoices())
+                    .map(choice -> {
+                        // The role may be absent on a delta; fall back to the assistant role.
+                        AuthorRole role = choice.getDelta().getRole() == null
+                            ? AuthorRole.ASSISTANT
+                            : AuthorRole.valueOf(choice.getDelta().getRole().toString()
+                                .toUpperCase(Locale.ROOT));
+
+                        return new OpenAIStreamingChatMessageContent<>(
+                            completions.getId(),
+                            role,
+                            choice.getDelta().getContent(),
+                            getModelId(),
+                            null,
+                            null,
+                            null,
+                            Collections.emptyList());
+                    });
+            });
+    }
+
+    /**
+     * Streams the chat completion for a single prompt.
+     * <p>
+     * The prompt is added as a user message to a new {@link ChatHistory}, which is then passed
+     * to the chat-history overload.
+     *
+     * @param prompt            the prompt to add as a user message
+     * @param kernel            the kernel passed on to the chat-history overload, may be null
+     * @param invocationContext the invocation context passed on to the chat-history overload,
+     *                          may be null
+     * @return the flux returned by the chat-history overload
+     */
+    @Override
+    public Flux<StreamingChatContent<?>> getStreamingChatMessageContentsAsync(
+        String prompt,
+        @Nullable Kernel kernel,
+        @Nullable InvocationContext invocationContext) {
+        ChatHistory singlePromptHistory = new ChatHistory().addUserMessage(prompt);
+        return getStreamingChatMessageContentsAsync(singlePromptHistory, kernel, invocationContext);
+    }
+
     // Holds messages temporarily as we build up our result
     private static class ChatMessages {
 
 
@@ -0,0 +1,41 @@
+// Copyright (c) Microsoft. All rights reserved.
+package com.microsoft.semantickernel.aiservices.openai.chatcompletion;
+
+import com.microsoft.semantickernel.orchestration.FunctionResultMetadata;
+import com.microsoft.semantickernel.services.chatcompletion.AuthorRole;
+import com.microsoft.semantickernel.services.chatcompletion.StreamingChatContent;
+import java.nio.charset.Charset;
+import java.util.List;
+import javax.annotation.Nullable;
+
+/**
+ * An {@link OpenAIChatMessageContent} that also implements {@link StreamingChatContent} by
+ * carrying an identifier alongside the message data.
+ *
+ * @param <T> The type of the inner content.
+ */
+public class OpenAIStreamingChatMessageContent<T> extends OpenAIChatMessageContent<T> implements
+    StreamingChatContent<T> {
+
+    private final String id;
+
+    /**
+     * Creates a new instance of the {@link OpenAIStreamingChatMessageContent} class.
+     * <p>
+     * Every argument except {@code id} is handed unchanged to the
+     * {@link OpenAIChatMessageContent} constructor.
+     *
+     * @param id           The identifier returned by {@link #getId()}.
+     * @param authorRole   The author role that generated the content.
+     * @param content      The content.
+     * @param modelId      The model id.
+     * @param innerContent The inner content.
+     * @param encoding     The encoding.
+     * @param metadata     The metadata.
+     * @param toolCall     The tool calls.
+     */
+    public OpenAIStreamingChatMessageContent(
+        String id,
+        AuthorRole authorRole,
+        String content,
+        @Nullable String modelId,
+        @Nullable T innerContent,
+        @Nullable Charset encoding,
+        @Nullable FunctionResultMetadata metadata,
+        @Nullable List<OpenAIFunctionToolCall> toolCall) {
+        super(authorRole, content, modelId, innerContent, encoding, metadata, toolCall);
+        this.id = id;
+    }
+
+    /**
+     * Returns the identifier supplied at construction time.
+     *
+     * @return the id of this content item
+     */
+    @Override
+    public String getId() {
+        return this.id;
+    }
+}
@@ -0,0 +1,34 @@
+// Copyright (c) Microsoft. All rights reserved.
+package com.microsoft.semantickernel.aiservices.openai.textcompletion;
+
+import com.microsoft.semantickernel.services.StreamingTextContent;
+import com.microsoft.semantickernel.services.textcompletion.TextContent;
+
+import javax.annotation.Nullable;
+
+/**
+ * OpenAIStreamingTextContent is a {@link StreamingTextContent} whose inner content is a
+ * {@link TextContent}.
+ */
+public class OpenAIStreamingTextContent extends StreamingTextContent<TextContent> {
+
+    /**
+     * Initializes a new instance of the {@code OpenAIStreamingTextContent} class with a provided
+     * text content.
+     * <p>
+     * The remaining superclass constructor arguments are fixed to {@code 0}, {@code null} and
+     * {@code null}.
+     *
+     * @param content The text content.
+     */
+    public OpenAIStreamingTextContent(TextContent content) {
+        super(content, 0, null, null);
+    }
+
+    /**
+     * Returns the text of the wrapped {@link TextContent}.
+     *
+     * @return the inner content's text, or {@code null} when there is no inner content
+     */
+    @Override
+    @Nullable
+    public String getContent() {
+        final TextContent inner = getInnerContent();
+        return inner == null ? null : inner.getContent();
+    }
+
+}