文生图
千问文生图官网地址: https://bailian.console.aliyun.com/
开发
新建Module
pom文件
<?xml version="1.0" encoding="UTF-8"?>
<!-- Maven descriptor for the text-to-image demo module; inherits from the SpringAIAlibaba-test01 parent. -->
<project xmlns="http://maven.apache.org/POM/4.0.0"
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
<modelVersion>4.0.0</modelVersion>
<parent>
<groupId>com.miao</groupId>
<artifactId>SpringAIAlibaba-test01</artifactId>
<version>1.0-SNAPSHOT</version>
</parent>
<!-- NOTE(review): "Imgae" looks like a typo for "Image" (the main class is SAA07Text2ImageApplication) - confirm before renaming, since the coordinates are referenced externally. -->
<artifactId>SAA-07Text2Imgae</artifactId>
<properties>
<!-- Compile for and target Java 17. -->
<maven.compiler.source>17</maven.compiler.source>
<maven.compiler.target>17</maven.compiler.target>
<project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
</properties>
<dependencies>
<!-- No version declared here; presumably managed by the parent POM - confirm. -->
<dependency>
<groupId>org.springframework.boot</groupId>
<artifactId>spring-boot-starter-web</artifactId>
</dependency>
<!-- DashScope (Lingji) model service: speaks the Alibaba-ecosystem protocol, the counterpart of the OpenAI protocol -->
<dependency>
<groupId>com.alibaba.cloud.ai</groupId>
<artifactId>spring-ai-alibaba-starter-dashscope</artifactId>
<version>1.0.0.2</version>
</dependency>
<dependency>
<groupId>org.projectlombok</groupId>
<artifactId>lombok</artifactId>
<version>1.18.38</version>
</dependency>
</dependencies>
</project>
yml
# Embedded web server settings.
server:
  port: 8082
  servlet:
    # Force UTF-8 on servlet requests and responses.
    encoding:
      enabled: true
      force: true
      charset: UTF-8

spring:
  application:
    name: SAA-07
  ai:
    dashscope:
      # The key is not hard-coded; it is resolved from the `qwen-api-key` placeholder.
      api-key: ${qwen-api-key}
      # Optional overrides, left disabled:
      # url: https://dashscope.aliyuncs.com/api/v1
      # model: qwen-image-plus
启动类
package com.miao;
import org.springframework.boot.SpringApplication;
import org.springframework.boot.autoconfigure.SpringBootApplication;
/**
 * Spring Boot entry point for the text-to-image demo module.
 */
@SpringBootApplication
public class SAA07Text2ImageApplication {

    /**
     * Starts the Spring application with this class as its primary source.
     *
     * @param args command-line arguments, handed to Spring Boot unchanged
     */
    public static void main(String[] args) {
        new SpringApplication(SAA07Text2ImageApplication.class).run(args);
    }
}
业务
package com.miao.controller;
import com.alibaba.cloud.ai.dashscope.image.DashScopeImageOptions;
import jakarta.annotation.Resource;
import org.springframework.ai.image.ImageMessage;
import org.springframework.ai.image.ImageModel;
import org.springframework.ai.image.ImagePrompt;
import org.springframework.web.bind.annotation.GetMapping;
import org.springframework.web.bind.annotation.RequestParam;
import org.springframework.web.bind.annotation.RestController;
/**
 * REST controller exposing a text-to-image endpoint backed by the injected {@link ImageModel}.
 */
@RestController
public class Text2ImageController {

    /** Name of the image model requested on every call. */
    public static final String IMAGE_MODEL = "wan2.5-t2i-preview";

    @Resource
    private ImageModel imageModel;

    /**
     * Generates an image from a text prompt and returns the URL of the first generated image.
     *
     * @param prompt text description of the desired image, read from the {@code prompt} query parameter
     * @return the URL reported for the first generated image
     * @throws IllegalStateException if the model returns no response or no generated image
     */
    @GetMapping(value = "/image")
    public String image(@RequestParam(name = "prompt") String prompt) {
        // Wrap the raw text as the single message of the prompt.
        ImageMessage imageMessage = new ImageMessage(prompt);
        // Select the model explicitly for this request.
        DashScopeImageOptions dashScopeImageOptions = DashScopeImageOptions.builder()
                .withModel(IMAGE_MODEL)
                .build();
        ImagePrompt imagePrompt = new ImagePrompt(imageMessage, dashScopeImageOptions);

        var response = imageModel.call(imagePrompt);
        // Guard explicitly so a call that yields no image surfaces as a descriptive error
        // instead of an opaque NullPointerException/IndexOutOfBoundsException from the call chain.
        if (response == null || response.getResults() == null || response.getResults().isEmpty()) {
            throw new IllegalStateException("Image model '" + IMAGE_MODEL + "' returned no image");
        }
        return response.getResults().get(0).getOutput().getUrl();
    }
}
文生音 CosyVoice
语音合成,又称文本转语音(Text-to-Speech,TTS),是将文本转换为自然语音的技术。该技术基于机器学习算法,通过学习大量语音样本,掌握语言的韵律、语调和发音规则,从而在接收到文本输入时生成真人般自然的语音内容。
官网文档: https://bailian.console.aliyun.com/
文档2: https://help.aliyun.com/zh/model-studio/ (原链接被截断,请在该文档站内查找 CosyVoice 语音合成相关页面)
调用逻辑
同步调用、异步调用、流式调用
同步调用
异步调用
流式调用
开发步骤(注意:下面的 YML、POM 和业务实现类与上文“文生图”模块的内容完全相同,尚未替换为 CosyVoice 语音合成的配置与代码)
YML
# NOTE(review): this configuration is identical to the text-to-image module's
# (same port and application name) - confirm it is what the text-to-speech demo should use.

# Embedded web server settings.
server:
  port: 8082
  servlet:
    # Force UTF-8 on servlet requests and responses.
    encoding:
      enabled: true
      force: true
      charset: UTF-8

spring:
  application:
    name: SAA-07
  ai:
    dashscope:
      # The key is not hard-coded; it is resolved from the `qwen-api-key` placeholder.
      api-key: ${qwen-api-key}
      # Optional overrides, left disabled:
      # url: https://dashscope.aliyuncs.com/api/v1
      # model: qwen-image-plus
POM文件
<?xml version="1.0" encoding="UTF-8"?>
<!-- Maven module descriptor inheriting from the SpringAIAlibaba-test01 parent. -->
<!-- NOTE(review): this POM is a verbatim copy of the text-to-image module's descriptor - confirm it is the one intended for the text-to-speech demo. -->
<project xmlns="http://maven.apache.org/POM/4.0.0"
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
<modelVersion>4.0.0</modelVersion>
<parent>
<groupId>com.miao</groupId>
<artifactId>SpringAIAlibaba-test01</artifactId>
<version>1.0-SNAPSHOT</version>
</parent>
<!-- NOTE(review): "Imgae" looks like a typo for "Image" - confirm before renaming, since the coordinates are referenced externally. -->
<artifactId>SAA-07Text2Imgae</artifactId>
<properties>
<!-- Compile for and target Java 17. -->
<maven.compiler.source>17</maven.compiler.source>
<maven.compiler.target>17</maven.compiler.target>
<project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
</properties>
<dependencies>
<!-- No version declared here; presumably managed by the parent POM - confirm. -->
<dependency>
<groupId>org.springframework.boot</groupId>
<artifactId>spring-boot-starter-web</artifactId>
</dependency>
<!-- DashScope (Lingji) model service: speaks the Alibaba-ecosystem protocol, the counterpart of the OpenAI protocol -->
<dependency>
<groupId>com.alibaba.cloud.ai</groupId>
<artifactId>spring-ai-alibaba-starter-dashscope</artifactId>
<version>1.0.0.2</version>
</dependency>
<dependency>
<groupId>org.projectlombok</groupId>
<artifactId>lombok</artifactId>
<version>1.18.38</version>
</dependency>
</dependencies>
</project>
业务实现类
package com.miao.controller;
import com.alibaba.cloud.ai.dashscope.image.DashScopeImageOptions;
import jakarta.annotation.Resource;
import org.springframework.ai.image.ImageMessage;
import org.springframework.ai.image.ImageModel;
import org.springframework.ai.image.ImagePrompt;
import org.springframework.web.bind.annotation.GetMapping;
import org.springframework.web.bind.annotation.RequestParam;
import org.springframework.web.bind.annotation.RestController;
/**
 * REST controller exposing a text-to-image endpoint backed by the injected {@link ImageModel}.
 *
 * <p>NOTE(review): this listing sits under the text-to-speech section of the notes, but the code
 * only performs image generation - confirm whether a speech-synthesis controller was intended.
 */
@RestController
public class Text2ImageController {

    /** Name of the image model requested on every call. */
    public static final String IMAGE_MODEL = "wan2.5-t2i-preview";

    @Resource
    private ImageModel imageModel;

    /**
     * Generates an image from a text prompt and returns the URL of the first generated image.
     *
     * @param prompt text description of the desired image, read from the {@code prompt} query parameter
     * @return the URL reported for the first generated image
     * @throws IllegalStateException if the model returns no response or no generated image
     */
    @GetMapping(value = "/image")
    public String image(@RequestParam(name = "prompt") String prompt) {
        // Wrap the raw text as the single message of the prompt.
        ImageMessage imageMessage = new ImageMessage(prompt);
        // Select the model explicitly for this request.
        DashScopeImageOptions dashScopeImageOptions = DashScopeImageOptions.builder()
                .withModel(IMAGE_MODEL)
                .build();
        ImagePrompt imagePrompt = new ImagePrompt(imageMessage, dashScopeImageOptions);

        var response = imageModel.call(imagePrompt);
        // Guard explicitly so a call that yields no image surfaces as a descriptive error
        // instead of an opaque NullPointerException/IndexOutOfBoundsException from the call chain.
        if (response == null || response.getResults() == null || response.getResults().isEmpty()) {
            throw new IllegalStateException("Image model '" + IMAGE_MODEL + "' returned no image");
        }
        return response.getResults().get(0).getOutput().getUrl();
    }
}