feat: Batch Image Generation

Onion99 · Onion99 · commit 27d1dda3ca71 · 2026-03-12T18:51:41.000+08:00
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -5,6 +5,14 @@
 本项目遵循 [语义化版本](https://semver.org/spec/v2.0.0.html)。
 
 
+## v5.6.0
+
+### ✨ New Features
+- **Batch Image Generation**:
+  - Added support for generating multiple images per request (1-10 images), produced one after another.
+  - Configurable "Batch Size" (生成数量) slider in Generation Quality settings.
+  - Each image is shown in the chat as soon as it finishes, with a progress label (e.g., `(1/4)`, `(2/4)`) appended to its message.
+
 ## v5.5.0
 
 - **Sampling Methods**:
diff --git a/composeApp/src/commonMain/composeResources/values-zh/strings.xml b/composeApp/src/commonMain/composeResources/values-zh/strings.xml
@@ -50,6 +50,8 @@
     <string name="settings_cfg_scale_description">低 = 创意 | 高 = 精准</string>
     <string name="settings_sampler">采样方法</string>
     <string name="settings_sampler_desc">选择用于图像去噪的生成算法</string>
+    <string name="settings_batch_count">生成数量</string>
+    <string name="settings_batch_count_description">一次生成的图片数量</string>
     <string name="settings_current_configuration">当前配置</string>
     <string name="settings_advanced_title">高级设置</string>
     <string name="settings_advanced_subtitle">性能调优与实验性功能</string>
diff --git a/composeApp/src/commonMain/composeResources/values/strings.xml b/composeApp/src/commonMain/composeResources/values/strings.xml
@@ -51,6 +51,8 @@
     <string name="settings_cfg_scale_description">Low = Creative | High = Precise</string>
     <string name="settings_sampler">Sampling Method</string>
     <string name="settings_sampler_desc">Select the algorithm used to denoise the image</string>
+    <string name="settings_batch_count">Batch Size</string>
+    <string name="settings_batch_count_description">Number of images to generate</string>
     <string name="settings_current_configuration">Current Configuration</string>
     <string name="settings_advanced_title">Advanced Settings</string>
     <string name="settings_advanced_subtitle">Experimental features and optimizations</string>
diff --git a/composeApp/src/commonMain/kotlin/org/onion/diffusion/ui/screen/HomeScreen.kt b/composeApp/src/commonMain/kotlin/org/onion/diffusion/ui/screen/HomeScreen.kt
@@ -360,7 +360,13 @@ private fun ChatMessagesList(chatMessages: List<ChatMessage>,snackbarHostState:
                             }
                         },
                         onRegenerate = if (message.metadata?.containsKey("prompt") == true) {
-                            { chatViewModel.reGenerateMessage(message) }
+                            {
+                                if (chatViewModel.isGenerating.value) {
+                                    coroutineScope.launch {
+                                        snackbarHostState.showSnackbar(getString(Res.string.error_no_interrupt_api))
+                                    }
+                                }else chatViewModel.reGenerateMessage(message)
+                            }
                         } else null,
                         onCopyText = { textToCopy ->
                             clipboardManager.setText(AnnotatedString(textToCopy))
diff --git a/composeApp/src/commonMain/kotlin/org/onion/diffusion/ui/screen/SettingScreen.kt b/composeApp/src/commonMain/kotlin/org/onion/diffusion/ui/screen/SettingScreen.kt
@@ -69,6 +69,8 @@ import minediffusion.composeapp.generated.resources.settings_cfg_scale
 import minediffusion.composeapp.generated.resources.settings_cfg_scale_description
 import minediffusion.composeapp.generated.resources.settings_sampler
 import minediffusion.composeapp.generated.resources.settings_sampler_desc
+import minediffusion.composeapp.generated.resources.settings_batch_count
+import minediffusion.composeapp.generated.resources.settings_batch_count_description
 import minediffusion.composeapp.generated.resources.settings_current_configuration
 import minediffusion.composeapp.generated.resources.settings_flash_attn
 import minediffusion.composeapp.generated.resources.settings_flash_attn_desc
@@ -123,6 +125,7 @@ fun SettingScreen(
     // Direct access to mutableStateOf properties (singleton ViewModel)
     val currentWidth by chatViewModel.imageWidth
     val currentHeight by chatViewModel.imageHeight
+    val currentBatchCount by chatViewModel.batchCount
     val currentSteps by chatViewModel.generationSteps
     val currentCfg by chatViewModel.cfgScale
     val currentSampler by chatViewModel.sampleMethod
@@ -197,6 +200,21 @@ fun SettingScreen(
                 subtitle = stringResource(Res.string.settings_generation_quality_subtitle),
                 icon = Icons.Default.Tune
             ) {
+                // Batch Count Slider (rounded, not truncated, so float drift such as 3.9999998f still stores 4)
+                SliderSetting(
+                    label = stringResource(Res.string.settings_batch_count),
+                    value = currentBatchCount.toFloat(),
+                    valueRange = 1f..10f,
+                    steps = 8,
+                    valueDisplay = currentBatchCount.toString(),
+                    description = stringResource(Res.string.settings_batch_count_description),
+                    onValueChange = { value ->
+                        chatViewModel.batchCount.value = kotlin.math.round(value).toInt().coerceIn(1, 10)
+                    }
+                )
+                
+                Spacer(modifier = Modifier.height(24.dp))
+                
                 // Steps Slider
                 SliderSetting(
                     label = stringResource(Res.string.settings_steps),
diff --git a/composeApp/src/commonMain/kotlin/org/onion/diffusion/viewmodel/ChatViewModel.kt b/composeApp/src/commonMain/kotlin/org/onion/diffusion/viewmodel/ChatViewModel.kt
@@ -72,6 +72,9 @@ class ChatViewModel  : ViewModel() {
     /** Image height - options: 128, 256, 512, 768, 1024 */
     var imageHeight = mutableStateOf(512)
     
+    /** Batch count - number of images to generate */
+    var batchCount = mutableStateOf(1)
+    
     /** Steps for generation - range: 1-50 */
     var generationSteps = mutableStateOf(5)
     
@@ -236,67 +239,80 @@ class ChatViewModel  : ViewModel() {
                     println("Image prompt: $promptContent")
                     println("Image negative: $negativeContent")
                     // Call txt2Img to generate image from the query prompt
-                    val startTime = Clock.System.now().toEpochMilliseconds()
 
                     val enabledLoras = loraList.filter { it.isEnabled }
                     val loraPaths = enabledLoras.map { it.path }.toTypedArray()
                     val loraStrengths = enabledLoras.map { it.strength }.toFloatArray()
 
-                    val imageByteArray = diffusionLoader.txt2Img(
-                        prompt = promptContent,
-                        negative = negativeContent,
-                        // 768×1024（竖版人像）/ 1024×768（横版场景）/ 1024×1344（高清竖版）
-                        width = imageWidth.value,
-                        height = imageHeight.value,
-                        steps = generationSteps.value,//模型渲染细节的 “迭代次数”，步数越多细节越丰富，但耗时越长（20-30 步性价比最高）
-                        cfg = cfgScale.value,// 控制模型 “遵守正向提示词” 的严格程度，数值越高越贴合提示词，越低越自由发挥（7.0-9.0 最常用）
-                        seed = Clock.System.now().toEpochMilliseconds(),
-                        sampleMethod = sampleMethod.value,
-                        loraPaths = loraPaths,
-                        loraStrengths = loraStrengths
-                    )
-
-                    // Debug logging to verify image format
-                    println("=== Image Generation Debug ===")
-                    println("Image size: ${imageByteArray?.size} bytes")
-                    if (imageByteArray != null && imageByteArray.size >= 10) {
-                        println("First 10 bytes: ${imageByteArray.take(10).joinToString { it.toString() }}")
-                        // PNG signature: 137 80 78 71 13 10 26 10 (需要使用 and 0xFF 转换为无符号值)
-                        // JPEG signature: 255 216 255
-                        val isPNG = imageByteArray.size >= 8 &&
-                                imageByteArray[0].toInt() and 0xFF == 137 &&
-                                imageByteArray[1].toInt() and 0xFF == 80 &&
-                                imageByteArray[2].toInt() and 0xFF == 78 &&
-                                imageByteArray[3].toInt() and 0xFF == 71
-                        val isJPEG = imageByteArray.size >= 3 &&
-                                imageByteArray[0].toInt() and 0xFF == 255 &&
-                                imageByteArray[1].toInt() and 0xFF == 216
-                        println("Format detection - PNG: $isPNG, JPEG: $isJPEG")
-                    }
-                    println("==============================")
-                    // Update the last message in the chat with the generated image
-                    // Using removeAt + add instead of index assignment to trigger recomposition
-                    if (_currentChatMessages.isNotEmpty()) {
-                        val lastIndex = _currentChatMessages.lastIndex
-                        _currentChatMessages.removeAt(lastIndex)
-                        val generationDuration = Clock.System.now().toEpochMilliseconds() - startTime
-                        val msg = getString(Res.string.image_generation_finished).replace("%s", formatDuration(generationDuration))
-                        val metadata = mapOf(
-                            "prompt" to promptContent,
-                            "negative_prompt" to negativeContent,
-                            "steps" to generationSteps.value.toString(),
-                            "cfg_scale" to cfgScale.value.toString(),
-                            "seed" to Clock.System.now().toEpochMilliseconds().toString(), // Note: verify if we should use the same seed as generation
-                            "model" to diffusionModelPath.value.substringAfterLast("/"),
-                             "loras" to enabledLoras.joinToString(",") { "${it.name}:${it.strength}" }
+                    val batchTotal = batchCount.value // snapshot so a settings change mid-run cannot skew labels
+                    for (i in 0 until batchTotal) {
+                        val startTime = Clock.System.now().toEpochMilliseconds()
+                        val seed = Clock.System.now().toEpochMilliseconds() // reused in metadata below
+                        val imageByteArray = diffusionLoader.txt2Img(
+                            prompt = promptContent,
+                            negative = negativeContent,
+                            // 768×1024 (portrait) / 1024×768 (landscape) / 1024×1344 (HD portrait)
+                            width = imageWidth.value,
+                            height = imageHeight.value,
+                            steps = generationSteps.value, // iteration count: more steps add detail but take longer (20-30 is the best trade-off)
+                            cfg = cfgScale.value, // how strictly the positive prompt is followed: higher is closer, lower is freer (7.0-9.0 most common)
+                            seed = seed,
+                            sampleMethod = sampleMethod.value,
+                            loraPaths = loraPaths,
+                            loraStrengths = loraStrengths
                         )
 
-                        _currentChatMessages.add(lastIndex, ChatMessage(
-                            message = msg,
-                            isUser = false,
-                            image = imageByteArray,
-                            metadata = metadata
-                        ))
+                        // Debug logging to verify image format
+                        println("=== Image Generation Debug ===")
+                        println("Image size: ${imageByteArray?.size} bytes")
+                        if (imageByteArray != null && imageByteArray.size >= 10) {
+                            println("First 10 bytes: ${imageByteArray.take(10).joinToString { it.toString() }}")
+                            // PNG signature: 137 80 78 71 13 10 26 10 (mask with `and 0xFF` to read bytes as unsigned)
+                            // JPEG signature: 255 216 255
+                            val isPNG = imageByteArray.size >= 8 &&
+                                    imageByteArray[0].toInt() and 0xFF == 137 &&
+                                    imageByteArray[1].toInt() and 0xFF == 80 &&
+                                    imageByteArray[2].toInt() and 0xFF == 78 &&
+                                    imageByteArray[3].toInt() and 0xFF == 71
+                            val isJPEG = imageByteArray.size >= 3 &&
+                                    imageByteArray[0].toInt() and 0xFF == 255 &&
+                                    imageByteArray[1].toInt() and 0xFF == 216
+                            println("Format detection - PNG: $isPNG, JPEG: $isJPEG")
+                        }
+                        println("==============================")
+                        // Update the last message in the chat with the generated image
+                        // Using removeAt + add instead of index assignment to trigger recomposition
+                        if (_currentChatMessages.isNotEmpty()) {
+                            val lastIndex = _currentChatMessages.lastIndex
+                            // The last entry is the message this image replaces: the one already
+                            // present before the loop on the first pass, or the empty placeholder
+                            // appended at the end of the previous pass. Both cases need the same
+                            // removal, so no first-iteration flag is kept.
+                            _currentChatMessages.removeAt(lastIndex)
+                            val generationDuration = Clock.System.now().toEpochMilliseconds() - startTime
+                            val batchStr = if (batchTotal > 1) " (${i + 1}/$batchTotal)" else ""
+                            val msg = getString(Res.string.image_generation_finished).replace("%s", formatDuration(generationDuration)) + batchStr
+                            val metadata = mapOf(
+                                "prompt" to promptContent,
+                                "negative_prompt" to negativeContent,
+                                "steps" to generationSteps.value.toString(),
+                                "cfg_scale" to cfgScale.value.toString(),
+                                "seed" to seed.toString(), // the exact seed passed to txt2Img for this image
+                                "model" to diffusionModelPath.value.substringAfterLast("/"),
+                                 "loras" to enabledLoras.joinToString(",") { "${it.name}:${it.strength}" }
+                            )
+
+                            _currentChatMessages.add(ChatMessage(
+                                message = msg,
+                                isUser = false,
+                                image = imageByteArray,
+                                metadata = metadata
+                            ))
+
+                            if (i < batchTotal - 1) {
+                                _currentChatMessages.add(ChatMessage("", false))
+                            }
+                        }
                     }
                 }
                 isGenerating.value = false
diff --git a/gradle/libs.versions.toml b/gradle/libs.versions.toml
@@ -1,6 +1,6 @@
 [versions]
 agp = "8.9.1"
-app-version="5.5.0"
+app-version="5.6.0"
 android-compileSdk = "36"
 android-minSdk ="29"
 android-targetSdk = "35"