codeproject
diff --git a/‎.gitignore‎
Lines changed: 18 additions & 0 deletions b/‎.gitignore‎
Lines changed: 18 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 51 additions & 0 deletions b/‎README.md‎
Lines changed: 51 additions & 0 deletions
diff --git a/‎Text2Image.pyproj‎
Lines changed: 62 additions & 0 deletions b/‎Text2Image.pyproj‎
Lines changed: 62 additions & 0 deletions
diff --git a/‎explore.html‎
Lines changed: 235 additions & 0 deletions b/‎explore.html‎
Lines changed: 235 additions & 0 deletions
diff --git a/‎install.bat‎
Lines changed: 8 additions & 0 deletions b/‎install.bat‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎install.sh‎
Lines changed: 8 additions & 0 deletions b/‎install.sh‎
Lines changed: 8 additions & 0 deletions
@@ -0,0 +1,18 @@
+# Misc
+.DS_Store
+
+# Python cache
+__pycache__/
+*.pyc
+
+# debug debris
+plate.png
+
+# Generated package files
+*-[0-9]*.[0-9]*.[0-9]*.zip
+
+# Models
+paddleocr
+
+# Python install / Virtual environment
+bin/
@@ -0,0 +1,51 @@
+# Text-to-Image Module for CodeProject.AI Server
+
+This is a Text-to-Image module using Stable Diffusion for [CodeProject.AI Server](https://www.codeproject.com/Articles/5322557/CodeProject-AI-Server-AI-the-easy-way). The actual module itself is downloadable via the CodeProject.AI Server's dashboard.
+
+## To develop and debug this code
+
+1. Clone the main [server repo](https://github.com/codeproject/CodeProject.AI-Server) into a directory such as `CodeProject/CodeProject.AI-Server`
+
+2. Clone this Text2Image repo into a separate folder `CodeProject/CodeProject.AI-Modules`
+
+    You should now have
+
+    ```text
+    CodeProject
+      - CodeProject.AI-Server
+         - demos
+         - src
+         - ... etc
+      - CodeProject.AI-Modules
+         - CodeProject.AI-Text2Image (this repo)
+    ```
+
+3. **If you have NOT run dev setup on the server**
+    Run the server dev setup scripts by opening a terminal in `CodeProject.AI-Server/src/` then, for Windows, run `setup.bat`, or for Linux/macOS run `bash setup.sh`.<br>
+    This will set up the server, and will also set up this module as long as this module sits under a folder named `CodeProject.AI-Modules`, with `CodeProject.AI-Modules` being at the same folder level as `CodeProject.AI-Server`.
+
+    **If you have already set up the server**
+    You can run the setup for just this module by running the setup script from a terminal opened in this folder
+   ```BAT
+   REM For Windows
+   ..\..\CodeProject.AI-Server\src\setup.bat
+   ```
+   ```bash
+   # For Linux/macOS
+   bash ../../CodeProject.AI-Server/src/setup.sh
+   ```
+4. Open the server repo in Visual Studio Code (or Visual Studio) and build and launch the server (Build and Launch server in the Run and Debug menu in VS Code). This will start the server, which in turn will load the settings file from this module.
+    <br>You can start this module directly from the CodeProject.AI Server dashboard, or you can run this module as a separate process via the 'Launch Text2Image' Debug and Run option in VS Code.
+
+## To create a package for this module
+
+Assuming the folder structure outlined above, run
+
+   ```BAT
+   REM For Windows
+   ..\..\CodeProject.AI-Server\src\create_packages.bat
+   ```
+   ```bash
+   # For Linux/macOS
+   bash ../../CodeProject.AI-Server/src/create_packages.sh
+   ```
@@ -0,0 +1,62 @@
+<Project DefaultTargets="Build" xmlns="http://schemas.microsoft.com/developer/msbuild/2003" ToolsVersion="4.0">
+  <PropertyGroup>
+    <Configuration Condition=" '$(Configuration)' == '' ">Debug</Configuration>
+    <SchemaVersion>2.0</SchemaVersion>
+    <ProjectGuid>2022ed32-14c4-4ca6-aac3-d58d724805ed</ProjectGuid>
+    <ProjectHome>.</ProjectHome>
+    <StartupFile>stable_diffusion_adapter.py</StartupFile>
+    <SearchPath>
+    </SearchPath>
+    <WorkingDirectory>.</WorkingDirectory>
+    <OutputPath>.</OutputPath>
+    <Name>Text2Image</Name>
+    <RootNamespace>Text2Image</RootNamespace>
+    <InterpreterId>MSBuild|venv|$(MSBuildProjectFullPath)</InterpreterId>
+  </PropertyGroup>
+  <PropertyGroup Condition=" '$(Configuration)' == 'Debug' ">
+    <DebugSymbols>true</DebugSymbols>
+    <EnableUnmanagedDebugging>false</EnableUnmanagedDebugging>
+  </PropertyGroup>
+  <PropertyGroup Condition=" '$(Configuration)' == 'Release' ">
+    <DebugSymbols>true</DebugSymbols>
+    <EnableUnmanagedDebugging>false</EnableUnmanagedDebugging>
+  </PropertyGroup>
+  <ItemGroup>
+    <Compile Include="stable_diffusion.py" />
+    <Compile Include="stable_diffusion_adapter.py" />
+  </ItemGroup>
+  <ItemGroup>
+    <Content Include="explore.html" />
+    <Content Include="install.bat" />
+    <Content Include="install.sh" />
+    <Content Include="modulesettings.json" />
+    <Content Include="requirements.cuda11.txt" />
+    <Content Include="requirements.cuda12.txt" />
+    <Content Include="requirements.macos.arm64.txt" />
+    <Content Include="requirements.macos.txt" />
+    <Content Include="requirements.txt" />
+  </ItemGroup>
+  <ItemGroup>
+    <Interpreter Include="bin\windows\python39\venv\">
+      <Id>venv</Id>
+      <Version>3.9</Version>
+      <Description>venv (Python 3.9 (64-bit))</Description>
+      <InterpreterPath>Scripts\python.exe</InterpreterPath>
+      <WindowsInterpreterPath>Scripts\pythonw.exe</WindowsInterpreterPath>
+      <PathEnvironmentVariable>PYTHONPATH</PathEnvironmentVariable>
+      <Architecture>X64</Architecture>
+    </Interpreter>
+  </ItemGroup>
+  <ItemGroup>
+    <Folder Include="assets\" />
+  </ItemGroup>
+  <Import Project="$(MSBuildExtensionsPath32)\Microsoft\VisualStudio\v$(VisualStudioVersion)\Python Tools\Microsoft.PythonTools.targets" />
+  <!-- Uncomment the CoreCompile target to enable the Build command in
+       Visual Studio and specify your pre- and post-build commands in
+       the BeforeBuild and AfterBuild targets below. -->
+  <!--<Target Name="CoreCompile" />-->
+  <Target Name="BeforeBuild">
+  </Target>
+  <Target Name="AfterBuild">
+  </Target>
+</Project>
@@ -0,0 +1,235 @@
+<!DOCTYPE html>
+<html lang="en" xmlns="http://www.w3.org/1999/xhtml">
+<!--
+CODEPROJECT.AI SERVER MODULE EXPLORER
+
+This page provides the means to test this module using the same infrastructure as
+the CodeProject.AI Server explorer. This page also provides the UI elements that
+the explorer will parse and use to build up the UI of the main explorer itself.
+
+RULES AND CONVENTIONS
+
+1. This page should provide sufficient functionality to test and explore this
+   module.
+
+2. This page should use the functionality in the explorer.js file so that when
+   the elements of this page are inserted into the main explorer, it all works
+   seamlessly. Specifically, you will probably use
+
+   - clearImagePreview:         Clears the image preview area.
+   - previewImage:              Displays an image in the shared image preview area and takes an
+                                input[type=file] as parameter.
+   - submitRequest:             Sends a request to the AI server.
+   - setResultsHtml:            Sets the HTML in the shared 'results' element. Parameter is the HTML
+                                to display.
+   - getProcessingMetadataHtml: Gets HTML representing the common data returned from a call to a
+                                module.
+   - displayBaseResults:        Displays the common data returned from a call to a module.
+   - showPredictionSummary:     Displays in the shared HTML results pane the list of predictions 
+                                returned from an inference operation.
+   - clearImageResult:          Clears the image result area 
+   - showResultsImageData:      Displays an image in the shared image results area using the data
+                                returned from a call to a module, and overlays bounding boxes if
+                                present in the data
+   - showResultsBoundingBoxes:  Displays bounding boxes on the shared image results area based on
+                                the boxes returned in the predictions parameter. The first param is
+                                an array of predictions returned from a computer vision operation.
+
+3. There are 3 parts of this page that will be pulled into the main explorer
+   during runtime: The HTML, the script, and the CSS. These sections are bounded by
+
+    - HTML:   START EXPLORER MARKUP / END EXPLORER MARKUP pair, each within HTML comment brackets
+    - Script: START EXPLORER SCRIPT / END EXPLORER SCRIPT pair, each as a // comment on its own line
+    - CSS:    START EXPLORER STYLE  / END EXPLORER STYLE pair, each inside /* ... */ comments
+
+   These delimiters should be on a line by themselves
+
+4. **Please provide output elements to display the results of operations** if
+   you wish to use the standard HTML / Image results elements in the main explorer
+   
+   - For HTML output, include a DIV with id 'results'
+   - For Image preview, include an IMG element with id imgPreview
+   - For image results, include an IMG element with id imgPreview and a DIV with
+     id 'imgMask'.
+   - You can use a single image for both preview and results if you wish by only
+     including an imgPreview image. Make sure you have the imgMask DIV though.
+   - For Sound preview, include an AUDIO element with id 'snd' that contains a
+     SOURCE tag
+
+5. When this file is parsed and injected into the larger explorer, the HTML is
+   injected first, then the script, then the CSS.
+
+6. **To ensure uniqueness of elements** you can include the _MID_ macro in any
+   name. This will be expanded to be [ModuleId]_ where [ModuleId] is the literal
+   ID of this module. For instance <div id="_MID_TextBox"> becomes <div id="MyModuleId_TextBox">
+-->
+<head>
+    <meta charset="utf-8" />
+    <title>Text2Image Module Test</title>
+
+    <link id="bootstrapCss" rel="stylesheet" type="text/css" href="http://localhost:32168/assets/bootstrap-dark.min.css">
+    <!--<link rel="stylesheet" type="text/css" href="http://localhost:32168/assets/server.css?v=2.5.0.0">-->
+    <script type="text/javascript" src="http://localhost:32168/assets/server.js"></script>
+    <script type="text/javascript" src="http://localhost:32168/assets/explorer.js"></script>
+
+    <style>
+/* START EXPLORER STYLE */
+/* END EXPLORER STYLE */
+    </style>
+
+</head>
+<body class="dark-mode">
+<div class="mx-auto" style="max-width: 800px;">
+    <h2 class="mb-3">Text2Image Module Test</h2>
+    <form method="post" action="" enctype="multipart/form-data" id="myform">
+
+<!-- START EXPLORER MARKUP -->
+        <div class="form-group row">
+            <div>
+                <label for="_MID_prompt" class="col-form-label col-2">Prompt</label>
+                <textarea id="_MID_prompt" class="w-100" style="height:100px"
+                    title="The prompt to be used by Stable Diffusion to create the image"></textarea>
+            </div>
+            <div>
+                <label for="_MID_negative_prompt" class="col-form-label">Negative Prompt</label>
+                <textarea id="_MID_negative_prompt" class="w-100" style="height:100px"
+                    title="The negative prompt to be used by Stable Diffusion to create the image"></textarea>
+            </div>
+
+            <!-- Generation settings, row 1: image count, seed (optionally fixed) and inference steps -->
+            <div class="row mb-3">
+                <div class="col-4">
+                    <label for="_MID_num_images" class="form-label">Images</label>
+                    <input type="number" id="_MID_num_images" class="form-control"
+                        min="1" max="4" step="1" value="1" title="The number of images to generate. Defaults to 1."/>
+                </div>
+                <div class="col-4">
+                    <label for="_MID_seed" class="form-label">Seed</label>
+                    <input id="_MID_seed" class="form-control" type="number" value="0"
+                        title="The seed to use for the diffusion random number generator. If Fixed is checked will use this value, otherwise uses random value."/>
+                    <label for="_MID_seed_fixed" class="form-check-label" >Fixed</label>
+                    <input id="_MID_seed_fixed" class="form-check-input ms-2" type="checkbox"
+                            title="If checked, will use the value above rather than a random value. This allows for reproducible image generation."/>
+                </div>
+                <div class="col-4">
+                    <label for="_MID_num_steps" class="form-label">Steps</label>
+                    <input type="number" id="_MID_num_steps" class="form-control" min="1" max="100"
+                        step="1" value="40" title="The number of inference steps to run"/>
+                </div>
+            </div>
+            <!-- Generation settings, row 2: guidance scale and output image dimensions -->
+            <div class="row mb-3">
+                <div class="col-4">
+                    <label for="_MID_guidance" class="form-label">Guidance</label>
+                    <input type="number" id="_MID_guidance" class="form-control" min="0.0" max="20.0"
+                        step="0.1" value="7" title="How well the process aligns with the prompt for image generation (0.0 - 20.0)."/>
+                </div>
+                <div class="col-4">
+                    <label for="_MID_width" class="form-label">Width</label>
+                    <input type="number" id="_MID_width" class="form-control" min="128" max="1024"
+                        step="8" value="512" title="The width of the image to be created. Defaults to 512. Must be a multiple of 8."/>
+                </div>
+                <div class="col-4">
+                    <label for="_MID_height" class="form-label">Height</label>
+                    <input type="number" id="_MID_height" class="form-control" min="128" max="1024"
+                        step="8" value="512" title="The height of the image to be created. Must be a multiple of 8."/>
+                </div>
+            </div>
+            <input id="_MID_generte" class="form-control btn-success" type="button" value="Generate Image"
+                   style="width:11rem" onclick="_MID_onGenerateImages()" />
+        </div>
+<hr>
+<!-- END EXPLORER MARKUP -->
+
+        <div class="w-100 position-relative form-control my-4 p-0">
+            <div id="imgMask" class="position-absolute"
+                    style="left:0;top:0;pointer-events:none;z-index:10"></div>
+            <img src="" id="imgPreview" class="w-100" style="height:250px;visibility:hidden">
+        </div>
+        <div>
+            <h2>Results</h2>
+            <div id="results" name="results" class="bg-light p-3" style="min-height: 100px;"></div>
+        </div>
+
+    </form>
+
+    <script type="text/javascript">
+        // START EXPLORER SCRIPT
+
+        async function _MID_onGenerateImages() {
+
+            clearImagePreview();
+
+            if (!_MID_prompt.value) {
+                alert("No image prompt specified");
+                return;
+            }
+
+            setResultsHtml("Generating Images...");
+            let params = [['prompt',                _MID_prompt.value],
+                          ['num_images_per_prompt', _MID_num_images.value],
+                          ['seed',                  _MID_seed_fixed.checked ? _MID_seed.value : null],
+                          ['num_inference_steps',   _MID_num_steps.value],
+                          ['guidance_scale',        _MID_guidance.value],
+                          ['width',                 _MID_width.value],
+                          ['height',                _MID_height.value]];
+
+            if (_MID_negative_prompt.value != "") {
+                params.push(['negative_prompt', _MID_negative_prompt.value]);
+            }
+
+            let data = await submitRequest('text2image', 'create', null, params);
+            if (data) {
+                // get the commandId to so we can poll for the results
+                _MID_commandId = data.commandId;
+                _MID_moduleId  = data.moduleId;
+
+                params         = [['commandId', _MID_commandId], ['moduleId', _MID_moduleId]];
+                done           = false;
+                loopCount      = 0;
+                spinner        = "|/-\\";
+
+                while (!done) {
+                    
+                    await delay(1000);
+
+                    let results = await submitRequest('text2image', 'get_command_status', null, params);
+                    if (results && results.success) {
+
+                        if (results.commandStatus == "failed") {
+                            done = true;
+                            setResultsHtml(results?.error || "Unknown error");
+                        } 
+                        else {
+                            let message = results.message;
+                            if (results.commandStatus == "completed") {
+                                done = true;
+                                _MID_seed.value = results?.seed || 0;
+                            }
+                            else {
+                                spinChar = spinner.charAt(loopCount++ % spinner.length);
+                                message = spinChar + " " + message;
+                            }
+
+                            setResultsHtml(message);
+
+                            if (results.images && results.images.length > 0)
+                                showResultsImage(results.images[0], results.width, results.height);
+                        }
+                    }
+                    else {
+                        // TODO: check for timeouts and other network errors.
+                        done = true;
+                        // setResultsHtml(results?.error || "No response from server");
+                    }
+                }
+            };
+        }
+
+        // =====================================================================
+        // Startup
+
+
+// END EXPLORER SCRIPT
+    </script>
+</div>
+</body>
+</html>
@@ -0,0 +1,8 @@
+REM Module install script for Text2Image. Continues only when the first argument is "install";
+REM otherwise it prints a notice, pauses, and leaves the script via goto:eof.
+@if "%1" NEQ "install" (
+    echo This script is only called from ..\..\setup.bat
+    @pause
+    @goto:eof
+)
+
+REM NOTE(review): no install actions are currently performed here. The commented-out call
+REM below refers to YOLO models and looks like a leftover from another module's install
+REM script - confirm whether it should be removed or replaced.
+REM Download the YOLO models from the CodeProject models/ folder and store in /assets
+REM call "%sdkScriptsDirPath%\utils.bat" GetFromServer "models/" "models-yolo8-pt.zip" "assets" "Downloading Standard YOLO models..."
@@ -0,0 +1,8 @@
+# Module install script for Text2Image. Continues only when the first argument is
+# "install"; otherwise it shows a notice (read waits up to 3 seconds for input)
+# and exits with status 1.
+if [ "$1" != "install" ]; then
+    read -t 3 -p "This script is only called from: bash ../../setup.sh"
+    echo
+    exit 1 
+fi
+
+# NOTE(review): no install actions are currently performed here. The commented-out
+# call below refers to YOLO models and looks like a leftover from another module's
+# install script - confirm whether it should be removed or replaced.
+# Download the YOLO models from the CodeProject models/ folder and store in /assets 
+# getFromServer "models/" "models-yolo8-pt.zip"  "assets" "Downloading Standard YOLO models..."