代码初始化
This commit is contained in:
@@ -2,105 +2,64 @@ package audio
|
||||
|
||||
import (
|
||||
"context"
|
||||
"encoding/json"
|
||||
"strings"
|
||||
|
||||
common "media/controller/common"
|
||||
dto "media/model/dto/audio"
|
||||
service "media/service/asr"
|
||||
|
||||
"gitea.com/red-future/common/beans"
|
||||
"github.com/gogf/gf/v2/frame/g"
|
||||
"github.com/gogf/gf/v2/net/ghttp"
|
||||
)
|
||||
|
||||
type audio struct{}
|
||||
|
||||
var AudioExtract = new(audio)
|
||||
|
||||
// safeResult 对外输出的识别结果(隐藏内部路径)
|
||||
type safeResult struct {
|
||||
Text string `json:"text"`
|
||||
Model string `json:"model"`
|
||||
Language string `json:"language"`
|
||||
AudioSize int64 `json:"audioSize"`
|
||||
AudioDuration string `json:"audioDuration"`
|
||||
Scenes *dto.SceneSummaryDTO `json:"scenes,omitempty"`
|
||||
}
|
||||
|
||||
// safeItem 对外输出的单视频结果
|
||||
type safeItem struct {
|
||||
FileName string `json:"fileName"`
|
||||
Result *safeResult `json:"result,omitempty"`
|
||||
Error string `json:"error,omitempty"`
|
||||
}
|
||||
|
||||
// TranscribeHandler 语音转文字+分镜分析
|
||||
// 支持两种入参方式:
|
||||
// 1. JSON body: {"video_urls":[...], "model":"medium", "language":"zh", "threshold":0.3}
|
||||
// 2. 文件上传: files 参数(兼容单/多文件)
|
||||
func (c *audio) TranscribeHandler(r *ghttp.Request) {
|
||||
ctx := r.Context()
|
||||
ctx = context.WithValue(ctx, "user", &beans.User{UserName: "admin"})
|
||||
|
||||
// 优先尝试 JSON body(URL 列表模式)
|
||||
body := r.GetBody()
|
||||
if len(body) > 0 && body[0] == '{' {
|
||||
var req dto.TranscribeReq
|
||||
if json.Unmarshal(body, &req) == nil && len(req.VideoURLs) > 0 {
|
||||
// 填充默认值
|
||||
if req.Model == "" {
|
||||
req.Model = g.Cfg().MustGet(ctx, "whisper.model", "medium").String()
|
||||
}
|
||||
if req.Language == "" {
|
||||
req.Language = g.Cfg().MustGet(ctx, "whisper.language", "zh").String()
|
||||
}
|
||||
if req.Threshold <= 0 {
|
||||
req.Threshold = 0.3
|
||||
}
|
||||
|
||||
res, svcErr := service.VideoTranscribe.TranscribeWithURLs(ctx, &req)
|
||||
if svcErr != nil {
|
||||
r.Response.WriteJson(g.Map{"code": 500, "message": svcErr.Error()})
|
||||
return
|
||||
}
|
||||
r.Response.WriteJson(g.Map{"code": 200, "message": "success", "data": toSafeItems(res.Results)})
|
||||
return
|
||||
}
|
||||
// Create 创建语音转文字异步任务 POST /audio/transcribe
|
||||
func (c *audio) Create(ctx context.Context, req *dto.TranscribeReq) (res *dto.CreateTaskRes, err error) {
|
||||
ctx = withUser(ctx)
|
||||
fileNames := make([]string, len(req.VideoURLs))
|
||||
for i, u := range req.VideoURLs {
|
||||
parts := strings.Split(u, "/")
|
||||
fileNames[i] = parts[len(parts)-1]
|
||||
}
|
||||
|
||||
// 文件上传模式
|
||||
savePaths, err := common.SaveUploadedFiles(r)
|
||||
if err != nil || len(savePaths) == 0 {
|
||||
r.Response.WriteJson(g.Map{"code": 400, "message": "请上传视频文件( multipart )或提供 video_urls( JSON )"})
|
||||
return
|
||||
g.Log().Infof(ctx, "收到转写请求, 回调URL: %s", req.CallbackURL)
|
||||
|
||||
params := &service.CreateTaskParams{
|
||||
InputData: req.VideoURLs,
|
||||
FileNames: fileNames,
|
||||
Model: req.Model,
|
||||
Language: req.Language,
|
||||
Threshold: req.Threshold,
|
||||
CallbackURL: req.CallbackURL,
|
||||
}
|
||||
|
||||
results := service.VideoTranscribe.TranscribeUpload(ctx, savePaths,
|
||||
r.Get("model", g.Cfg().MustGet(ctx, "whisper.model", "medium").String()).String(),
|
||||
r.Get("language", g.Cfg().MustGet(ctx, "whisper.language", "zh").String()).String(),
|
||||
r.Get("threshold", 0.3).Float64())
|
||||
|
||||
r.Response.WriteJson(g.Map{"code": 200, "message": "success", "data": toSafeItems(results)})
|
||||
return service.AudioTask.Create(ctx, params)
|
||||
}
|
||||
|
||||
// toSafeItems 将结果转为安全的响应格式(移除 audioPath 等内部路径)
|
||||
func toSafeItems(results []dto.TranscribeItem) []safeItem {
|
||||
var items []safeItem
|
||||
for _, item := range results {
|
||||
si := safeItem{FileName: item.FileName, Error: item.Error}
|
||||
if item.Result != nil {
|
||||
if r, ok := item.Result.(*dto.TranscribeResult); ok {
|
||||
si.Result = &safeResult{
|
||||
Text: r.Text,
|
||||
Model: r.Model,
|
||||
Language: r.Language,
|
||||
AudioSize: r.AudioSize,
|
||||
AudioDuration: r.AudioDuration,
|
||||
Scenes: r.Scenes,
|
||||
}
|
||||
}
|
||||
}
|
||||
items = append(items, si)
|
||||
// GetTask 获取任务详情 GET /audio/task/{taskId}
|
||||
func (c *audio) GetTask(ctx context.Context, req *dto.GetTaskReq) (res *dto.GetTaskRes, err error) {
|
||||
ctx = withUser(ctx)
|
||||
return service.AudioTask.GetTask(ctx, req)
|
||||
}
|
||||
|
||||
// GetProgress 获取任务进度 GET /audio/task/{taskId}/progress
|
||||
func (c *audio) GetProgress(ctx context.Context, req *dto.GetProgressReq) (res *dto.GetProgressRes, err error) {
|
||||
ctx = withUser(ctx)
|
||||
return service.AudioTask.GetProgress(ctx, req)
|
||||
}
|
||||
|
||||
// ListTasks 获取任务列表 GET /audio/tasks
|
||||
func (c *audio) ListTasks(ctx context.Context, req *dto.ListTaskReq) (res *dto.ListTaskRes, err error) {
|
||||
ctx = withUser(ctx)
|
||||
return service.AudioTask.ListTasks(ctx, req)
|
||||
}
|
||||
|
||||
// withUser 为 context 注入默认用户(无认证基础设施时使用)
|
||||
func withUser(ctx context.Context) context.Context {
|
||||
if ctx.Value("user") == nil {
|
||||
ctx = context.WithValue(ctx, "user", &beans.User{UserName: "admin", TenantId: 1})
|
||||
}
|
||||
return items
|
||||
return ctx
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user