文生图 + 文生音

39 阅读1分钟

文生图

千问文生图官网地址: bailian.console.aliyun.com/?spm=5176.2…

开发

新建Module

image.png

POM文件

<?xml version="1.0" encoding="UTF-8"?>
<!-- Maven build descriptor for the text-to-image demo module. -->
<project xmlns="http://maven.apache.org/POM/4.0.0"
         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
    <modelVersion>4.0.0</modelVersion>
    <!-- Inherits from the SpringAIAlibaba-test01 parent POM. -->
    <parent>
        <groupId>com.miao</groupId>
        <artifactId>SpringAIAlibaba-test01</artifactId>
        <version>1.0-SNAPSHOT</version>
    </parent>

    <!-- NOTE(review): "Imgae" looks like a typo of "Image"; confirm before renaming. -->
    <artifactId>SAA-07Text2Imgae</artifactId>

    <!-- Compile for Java 17 and read sources as UTF-8. -->
    <properties>
        <maven.compiler.source>17</maven.compiler.source>
        <maven.compiler.target>17</maven.compiler.target>
        <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
    </properties>
    <dependencies>
        <!-- No version is declared here; presumably managed by the parent POM — verify. -->
        <dependency>
            <groupId>org.springframework.boot</groupId>
            <artifactId>spring-boot-starter-web</artifactId>
        </dependency>

        <!-- DashScope (Lingji) model service: calls go through the Alibaba-ecosystem protocol, the counterpart of the OpenAI protocol. -->
        <dependency>
            <groupId>com.alibaba.cloud.ai</groupId>
            <artifactId>spring-ai-alibaba-starter-dashscope</artifactId>
            <version>1.0.0.2</version>
        </dependency>

        <dependency>
            <groupId>org.projectlombok</groupId>
            <artifactId>lombok</artifactId>
            <version>1.18.38</version>
        </dependency>
    </dependencies>
</project>

YML

# Web server settings.
server:
  # Port the application listens on.
  port: 8082
  servlet:
    # Servlet encoding: enabled, forced, and set to UTF-8.
    encoding:
      enabled: true
      force: true
      charset: UTF-8

spring:
  application:
    name: SAA-07
  ai:
    dashscope:
      # Placeholder: the actual key is supplied from outside this file under the name qwen-api-key.
      api-key: ${qwen-api-key}
# The two entries below are commented out and therefore not applied.
#      url: https://dashscope.aliyuncs.com/api/v1
#      model: qwen-image-plus

启动类

package com.miao;

import org.springframework.boot.SpringApplication;
import org.springframework.boot.autoconfigure.SpringBootApplication;

/**
 * Spring Boot entry point for the text-to-image demo module.
 */
@SpringBootApplication
public class SAA07Text2ImageApplication {

    /**
     * Starts the Spring application with this class as its primary source.
     *
     * @param args command-line arguments, passed to Spring Boot unchanged
     */
    public static void main(String[] args) {
        SpringApplication application = new SpringApplication(SAA07Text2ImageApplication.class);
        application.run(args);
    }
}

业务

package com.miao.controller;

import com.alibaba.cloud.ai.dashscope.image.DashScopeImageOptions;
import jakarta.annotation.Resource;
import org.springframework.ai.image.ImageMessage;
import org.springframework.ai.image.ImageModel;
import org.springframework.ai.image.ImagePrompt;
import org.springframework.web.bind.annotation.GetMapping;
import org.springframework.web.bind.annotation.RequestParam;
import org.springframework.web.bind.annotation.RestController;

/**
 * REST controller that turns a text prompt into an image through the injected
 * {@link ImageModel} and replies with the URL of the generated picture.
 */
@RestController
public class Text2ImageController {
    /** Name of the image model requested on every call. */
    public static final String IMAGE_MODEL = "wan2.5-t2i-preview";

    /** Image model injected by the container. */
    @Resource
    private ImageModel imageModel;

    /**
     * Generates an image for the given prompt and returns its URL.
     *
     * @param prompt text description of the desired image, read from the {@code prompt}
     *               query parameter
     * @return the URL reported for the first generated image
     * @throws IllegalStateException if the model response contains no image or the first
     *                               image carries no output
     */
    @GetMapping(value = "/image")
    public String image(@RequestParam(name = "prompt") String prompt) {
        // Wrap the raw prompt text in the message type expected by the image API.
        ImageMessage imageMessage = new ImageMessage(prompt);

        // Select the model to use for this request.
        DashScopeImageOptions dashScopeImageOptions = DashScopeImageOptions.builder()
                .withModel(IMAGE_MODEL).build();

        // Combine the message and options into the prompt sent to the model.
        ImagePrompt imagePrompt = new ImagePrompt(imageMessage, dashScopeImageOptions);

        // Inspect the result list instead of chaining getResult(): a response without any
        // generation would otherwise surface as an opaque index/null-pointer failure.
        var generations = imageModel.call(imagePrompt).getResults();
        if (generations == null || generations.isEmpty()) {
            throw new IllegalStateException(
                    "Image model '" + IMAGE_MODEL + "' returned no image for the prompt");
        }

        var output = generations.get(0).getOutput();
        if (output == null) {
            throw new IllegalStateException(
                    "Image model '" + IMAGE_MODEL + "' returned an image without output data");
        }
        return output.getUrl();
    }
}

文生音 CosyVoice

语音合成,又称文本转语音(Text-to-Speech,TTS),是将文本转换为自然语音的技术。该技术基于机器学习算法,通过学习大量语音样本,掌握语言的韵律、语调和发音规则,从而在接收到文本输入时生成真人般自然的语音内容。

官网文档: bailian.console.aliyun.com/?spm=5176.2…

文档2: help.aliyun.com/zh/model-st…

调用逻辑

同步调用、异步调用、流式调用

同步调用

image.png

异步调用

image.png

流式调用

image.png

开发步骤

YML

# Web server settings.
server:
  # Port the application listens on.
  port: 8082
  servlet:
    # Servlet encoding: enabled, forced, and set to UTF-8.
    encoding:
      enabled: true
      force: true
      charset: UTF-8

spring:
  application:
    name: SAA-07
  ai:
    dashscope:
      # Placeholder: the actual key is supplied from outside this file under the name qwen-api-key.
      api-key: ${qwen-api-key}
# The two entries below are commented out and therefore not applied.
#      url: https://dashscope.aliyuncs.com/api/v1
#      model: qwen-image-plus

POM文件

<?xml version="1.0" encoding="UTF-8"?>
<!-- Maven build descriptor for the demo module. -->
<project xmlns="http://maven.apache.org/POM/4.0.0"
         xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
         xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
    <modelVersion>4.0.0</modelVersion>
    <!-- Inherits from the SpringAIAlibaba-test01 parent POM. -->
    <parent>
        <groupId>com.miao</groupId>
        <artifactId>SpringAIAlibaba-test01</artifactId>
        <version>1.0-SNAPSHOT</version>
    </parent>

    <!-- NOTE(review): "Imgae" looks like a typo of "Image"; confirm before renaming. -->
    <artifactId>SAA-07Text2Imgae</artifactId>

    <!-- Compile for Java 17 and read sources as UTF-8. -->
    <properties>
        <maven.compiler.source>17</maven.compiler.source>
        <maven.compiler.target>17</maven.compiler.target>
        <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
    </properties>
    <dependencies>
        <!-- No version is declared here; presumably managed by the parent POM — verify. -->
        <dependency>
            <groupId>org.springframework.boot</groupId>
            <artifactId>spring-boot-starter-web</artifactId>
        </dependency>

        <!-- DashScope (Lingji) model service: calls go through the Alibaba-ecosystem protocol, the counterpart of the OpenAI protocol. -->
        <dependency>
            <groupId>com.alibaba.cloud.ai</groupId>
            <artifactId>spring-ai-alibaba-starter-dashscope</artifactId>
            <version>1.0.0.2</version>
        </dependency>

        <dependency>
            <groupId>org.projectlombok</groupId>
            <artifactId>lombok</artifactId>
            <version>1.18.38</version>
        </dependency>
    </dependencies>
</project>

业务实现类(注意:下方代码与上文“文生图”部分的 Text2ImageController 完全相同,并未调用 CosyVoice 语音合成接口,此处应替换为文生音的实现)

package com.miao.controller;

import com.alibaba.cloud.ai.dashscope.image.DashScopeImageOptions;
import jakarta.annotation.Resource;
import org.springframework.ai.image.ImageMessage;
import org.springframework.ai.image.ImageModel;
import org.springframework.ai.image.ImagePrompt;
import org.springframework.web.bind.annotation.GetMapping;
import org.springframework.web.bind.annotation.RequestParam;
import org.springframework.web.bind.annotation.RestController;

/**
 * REST controller that turns a text prompt into an image through the injected
 * {@link ImageModel} and replies with the URL of the generated picture.
 */
@RestController
public class Text2ImageController {
    /** Name of the image model requested on every call. */
    public static final String IMAGE_MODEL = "wan2.5-t2i-preview";

    /** Image model injected by the container. */
    @Resource
    private ImageModel imageModel;

    /**
     * Generates an image for the given prompt and returns its URL.
     *
     * @param prompt text description of the desired image, read from the {@code prompt}
     *               query parameter
     * @return the URL reported for the first generated image
     * @throws IllegalStateException if the model response contains no image or the first
     *                               image carries no output
     */
    @GetMapping(value = "/image")
    public String image(@RequestParam(name = "prompt") String prompt) {
        // Wrap the raw prompt text in the message type expected by the image API.
        ImageMessage imageMessage = new ImageMessage(prompt);

        // Select the model to use for this request.
        DashScopeImageOptions dashScopeImageOptions = DashScopeImageOptions.builder()
                .withModel(IMAGE_MODEL).build();

        // Combine the message and options into the prompt sent to the model.
        ImagePrompt imagePrompt = new ImagePrompt(imageMessage, dashScopeImageOptions);

        // Inspect the result list instead of chaining getResult(): a response without any
        // generation would otherwise surface as an opaque index/null-pointer failure.
        var generations = imageModel.call(imagePrompt).getResults();
        if (generations == null || generations.isEmpty()) {
            throw new IllegalStateException(
                    "Image model '" + IMAGE_MODEL + "' returned no image for the prompt");
        }

        var output = generations.get(0).getOutput();
        if (output == null) {
            throw new IllegalStateException(
                    "Image model '" + IMAGE_MODEL + "' returned an image without output data");
        }
        return output.getUrl();
    }
}