添加协程管理功能，支持优雅关闭和并发控制

2025-12-24 17:54:18 +08:00 · 2025-12-24 17:54:18 +08:00 · 2e6e665984
parent cb60c605e3
commit 2e6e665984
11 changed files with 374 additions and 24 deletions
--- a/attachment/uploader.go
+++ b/attachment/uploader.go
@ -1,4 +1,4 @@
-package l_export_async
+package attachment

 import (
 	"bytes"
--- a/coroutine/README.md
+++ b/coroutine/README.md
@ -0,0 +1,50 @@
+# 协程启动管理器
+目前的主要作用是：
+   1. 简化写法，不用自己再defer记录日志
+   2. 优雅关闭
+   3. 统一管理方便后面扩展
+   4. 支持固定队列协程：定义最大数量，超过时会阻塞启动，直接有空闲的时候才会启动
+
+todolist:
+* [ ]. 控coroutine的状态：数量，时长
+
+## 使用步骤
+1. 交给kratos管理生命周期
+   ```go
+   // 1. 打开main.go
+   // 2. newApp方法中注入logHelper *log.Helper
+   // 3. 按如下代码提供给kratos管理生命周期
+   coroutineServer := coroutine.NewServer(logHelper)
+   serverOption := kratos.Server(
+     // 省略之前的一些已有变量...
+     coroutineServer,
+   ) 
+   ```
+   
+2. 使用示例
+   ```go
+   doDesc := "我是闭包中能访问到的变量，可以直接使用"
+   coroutine.Run("我是任务名称", func() {
+       // 模拟执行
+       fmt.Printf("开始：%s\n", doDesc)
+       time.Sleep(1 * time.Second)
+       fmt.Printf("开始：%s\n", doDesc)
+   })   
+   // 在Run里面会开启协程，不要自己在这里使用go关键字开启协程
+   // 错误示例：go coroutine.Run("我是任务名称", func() {})
+   ```
+
+3固定队列使用示例  
+   ```go
+   maxTaskCnt := 10 // 最大并行任务数量。超过时阻塞启动方，直到有有任务执行完成
+   f := NewFixed(maxTaskCnt)
+   doDesc := "我是闭包中能访问到的变量，可以直接使用"
+   f.Run("我是任务名称", func() {
+      // 模拟执行
+      fmt.Printf("开始：%s\n", doDesc)
+      time.Sleep(1 * time.Second)
+      fmt.Printf("开始：%s\n", doDesc)
+   })
+   // 在Run里面会开启协程，不要自己在这里使用go关键字开启协程
+   // 错误示例：go coroutine.Run("我是任务名称", func() {})
+   ```
--- a/coroutine/fixed.go
+++ b/coroutine/fixed.go
@ -0,0 +1,23 @@
+package coroutine
+
+type Fixed struct {
+	queues chan struct{}
+}
+
+func NewFixed(count int) *Fixed {
+	return &Fixed{
+		queues: make(chan struct{}, count),
+	}
+}
+
+// Run 运行指定函数
+// name 协程名称
+// fn 协程执行的函数
+func (f *Fixed) Run(name string, fn func()) {
+	f.queues <- struct{}{}
+	runAfter(name, fn, func() {
+		<-f.queues
+	})
+}
+
+// chan 的发送次数 >= 接收次数，可以不用close，由GC回收
--- a/coroutine/fixed_test.go
+++ b/coroutine/fixed_test.go
@ -0,0 +1,64 @@
+package coroutine
+
+import (
+	"fmt"
+	"testing"
+	"time"
+)
+
+func TestFixed_Run(t *testing.T) {
+	tests := []struct {
+		name            string
+		count           int
+		taskCnt         int
+		expectedMinMill time.Duration
+		expectedMaxMill time.Duration
+	}{
+		{
+			name:            "超过时阻塞 100ms",
+			count:           1,
+			taskCnt:         2,
+			expectedMinMill: 100 * time.Millisecond,
+		},
+		{
+			name:            "超过时阻塞 200ms",
+			count:           1,
+			taskCnt:         3,
+			expectedMinMill: 200 * time.Millisecond,
+		},
+		{
+			name:            "相等限制时不阻塞",
+			count:           3,
+			taskCnt:         3,
+			expectedMaxMill: 10 * time.Millisecond,
+		},
+		{
+			name:            "低于限制时不阻塞",
+			count:           4,
+			taskCnt:         3,
+			expectedMaxMill: 10 * time.Millisecond,
+		},
+	}
+	for _, tt := range tests {
+		t.Run(tt.name, func(t *testing.T) {
+			f := NewFixed(tt.count)
+			start := time.Now()
+
+			for i := 0; i < tt.taskCnt; i++ {
+				f.Run("test", func() {
+					time.Sleep(100 * time.Millisecond)
+				})
+			}
+
+			end := time.Now()
+			milliseconds := end.Sub(start).Milliseconds()
+			if tt.expectedMinMill > 0 && milliseconds < tt.expectedMinMill.Milliseconds() {
+				t.Errorf("运行时长最少 %d ms, 实际 %d ms", tt.expectedMinMill, milliseconds)
+			}
+			if tt.expectedMaxMill > 0 && milliseconds > tt.expectedMaxMill.Milliseconds() {
+				t.Errorf("运行时长不超过 %d ms, 实际 %d ms", tt.expectedMaxMill, milliseconds)
+			}
+			fmt.Println(milliseconds)
+		})
+	}
+}
--- a/coroutine/server.go
+++ b/coroutine/server.go
@ -0,0 +1,73 @@
+package coroutine
+
+import (
+	"context"
+	"fmt"
+	"gitea.cdlsxd.cn/self-tools/l-export-async/util"
+	"time"
+)
+
+// Server 管理协程
+// 提供给kratos当server使用，主要实现其start和stop，交给kratos管理其生命周期
+type Server struct {
+	// 关闭时最长等待时长
+	timeout time.Duration
+}
+
+type ServerOption func(s *Server)
+
+func WithServerTimeout(timeout time.Duration) ServerOption {
+	return func(s *Server) {
+		s.timeout = timeout
+	}
+}
+
+// NewServer 创建一个协程管理器
+// log 日志
+// timeout 关闭时最长等待时长
+func NewServer(log util.Logger, opts ...ServerOption) *Server {
+	globalLogger = log
+	s := &Server{
+		timeout: 24 * time.Hour, //默认最多等待24个小时
+	}
+	for _, opt := range opts {
+		opt(s)
+	}
+	return s
+}
+
+func (s *Server) Start(ctx context.Context) error {
+	return nil
+}
+
+func (s *Server) Stop(ctx context.Context) error {
+	myCtx, cancel := context.WithTimeout(context.Background(), s.timeout)
+	defer cancel()
+
+	// 每1s检查下业务是否都处理完成
+	ticker := time.NewTicker(1 * time.Second)
+	defer ticker.Stop()
+
+	for {
+		tasks := getTasks()
+		if len(tasks) == 0 {
+			fmt.Println("协程任务已全部优雅退出")
+			return nil
+		}
+		processStatusMsg := ""
+		for _, t := range tasks {
+			if processStatusMsg != "" {
+				processStatusMsg += "、"
+			}
+			processStatusMsg += t.name
+		}
+		fmt.Printf("等待协程任务退出，当前活动：%d 个：%s \n", len(tasks), processStatusMsg)
+		select {
+		case <-myCtx.Done():
+			//超时退出
+			err := fmt.Errorf("等待协程任务超时，即将退出")
+			return err
+		case <-ticker.C:
+		}
+	}
+}
--- a/coroutine/task.go
+++ b/coroutine/task.go
@ -0,0 +1,87 @@
+package coroutine
+
+import (
+	"fmt"
+	"gitea.cdlsxd.cn/self-tools/l-export-async/util"
+	"sync"
+)
+
+var activeTaskMu sync.Mutex
+var activeTask = make(map[*task]struct{})
+var globalLogger util.Logger
+
+type task struct {
+	name string
+	fn   func()
+}
+
+// addTask 添加任务
+func addTask(t *task) {
+	activeTaskMu.Lock()
+	defer activeTaskMu.Unlock()
+	activeTask[t] = struct{}{}
+}
+
+// removeTask 删除任务
+func removeTask(t *task) {
+	activeTaskMu.Lock()
+	defer activeTaskMu.Unlock()
+	delete(activeTask, t)
+}
+
+// getTaskSize 获取任务数量
+// nolint
+func getTaskSize() int {
+	activeTaskMu.Lock()
+	defer activeTaskMu.Unlock()
+	return len(activeTask)
+}
+
+// getTaskSize 获取任务数量
+func getTasks() []*task {
+	activeTaskMu.Lock()
+	defer activeTaskMu.Unlock()
+
+	tasks := make([]*task, 0, len(activeTask))
+	for t := range activeTask {
+		tasks = append(tasks, t)
+	}
+	return tasks
+}
+
+// Run 运行指定函数
+// name 协程名称
+// fn 协程执行的函数
+func Run(name string, fn func()) {
+	runAfter(name, fn, func() {})
+}
+
+// Run 运行指定函数
+// name 协程名称
+// fn 协程执行的函数
+func runAfter(name string, fn func(), afterFn func()) {
+	t := &task{name: name, fn: fn}
+	addTask(t)
+
+	go func() {
+		// 删除任务
+		defer removeTask(t)
+
+		// 记录panic错误
+		defer func() {
+			if r := recover(); r != nil {
+				if globalLogger != nil {
+					globalLogger.Errorf("coroutine %s panic：%+v", t.name, r)
+				} else {
+					fmt.Printf("coroutine %s panic：%+v", t.name, r)
+				}
+			}
+		}()
+
+		// 完毕后要执行的函数
+		defer afterFn()
+
+		// 运行指定函数
+		t.fn()
+	}()
+}
--- a/coroutine/task_test.go
+++ b/coroutine/task_test.go
@ -0,0 +1,41 @@
+package coroutine
+
+import (
+	"context"
+	"fmt"
+	"testing"
+	"time"
+)
+
+func TestRun(t *testing.T) {
+	// 测试未超时情况
+	fmt.Println("-----测试超时情况------")
+	for i := 0; i < 5; i++ {
+		ii := i
+		name := fmt.Sprintf("测试任务%d", i)
+		Run(name, func() {
+			fmt.Printf("%s开始\n", name)
+			w := time.Second * time.Duration(ii)
+			time.Sleep(w)
+			fmt.Printf("%s完成\n", name)
+		})
+	}
+	err := NewServer(nil, WithServerTimeout(2*time.Second)).Stop(context.Background())
+	fmt.Println(err)
+
+	// 测试超时情况
+	fmt.Println("\n-----测试未超时情况------")
+	for i := 0; i < 5; i++ {
+		ii := i
+		name := fmt.Sprintf("测试任务%d", ii)
+		Run(name, func() {
+			fmt.Printf("%s开始\n", name)
+			w := time.Second * time.Duration(ii)
+			time.Sleep(w)
+			fmt.Printf("%s完成\n", name)
+		})
+	}
+	err = NewServer(nil).Stop(context.Background())
+	fmt.Println(err)
+
+}
--- a/export_async.go
+++ b/export_async.go
@ -6,11 +6,16 @@ import (
 	"encoding/base64"
 	"encoding/csv"
 	"encoding/json"
-	"finance/internal/pkg/helper/attachment"
+	"errors"
 	"fmt"
 	"strconv"
 	"strings"

+	"gitea.cdlsxd.cn/self-tools/l-export-async/attachment"
+	"gitea.cdlsxd.cn/self-tools/l-export-async/coroutine"
+	"github.com/google/uuid"
+	"github.com/redis/go-redis/v9"
+	"golang.org/x/sync/errgroup"
 	"io"
 	"os"
 	"path/filepath"
@ -18,10 +23,6 @@ import (
 	"sync"
 	"sync/atomic"
 	"time"
-
-	attachmentsdk "codeup.aliyun.com/5f9118049cffa29cfdd3be1c/attachment-sdk"
-	"github.com/google/uuid"
-	"golang.org/x/sync/errgroup"
 )

 var exportAsyncPool = &sync.Pool{
@ -50,7 +51,7 @@ var (
 	DefaultMaxRowPerFile   = 100000 ////每个Xlsx的行数，默认10000行->WithMaxRowPerFile
 	DefaultCsvToExcelBatch = 1000   ////csv转excel的批量写入缓冲区大小,逐行写入设置为1000->WithCustomBufferSize
 	DefaultWorkNum         = 1      // 并发协程数（务必大于1）,默认runtime.NumCPU() * 2->WithCustomWorkNum
-	ProcessLimit           = 1      //全局并行导出任务上限
+	ProcessLimit           = 1000   //全局并行导出任务上限
 	DefaultUploader        = &Uploader{
 		FieldFormName: "file",
 		System:        "crmApi",
@ -141,8 +142,7 @@ func (e *ExportAsync) Run(ctx context.Context) (string, error) {
 	if err != nil {
 		return "", fmt.Errorf("创建任务失败: %v", err)
 	}
-
-	go func() {
+	coroutine.Run(fmt.Sprintf("创建任务导出任务：%s", e.fileName), func() {
 		// 执行导出任务
 		subCtx, cancel := context.WithCancel(context.Background())
 		defer func() {
@ -162,7 +162,8 @@ func (e *ExportAsync) Run(ctx context.Context) (string, error) {
 		}
 		e.logTool.Infof("异步导出任务：%s,导出完成,总计导出%d条数据,下载地址：%s", e.task.Id, e.task.RowCount, source)

-	}()
+	})
+
 	return e.task.Id, nil
 }

@ -318,7 +319,7 @@ func (e *ExportAsync) upload(file string) (string, error) {
 	if err != nil {
 		return "", err
 	}
-	return attachmentsdk.GeneratePreviewPrivateUrl(e.uploader.Host, "", resp.Url, "", strings.TrimSuffix(e.fileName, ".zip"), time.Now().Unix()+300), nil
+	return attachment.GeneratePreviewPrivateUrl(e.uploader.Host, "", resp.Url, "", strings.TrimSuffix(e.fileName, ".zip"), time.Now().Unix()+300), nil
 }

 func (e *ExportAsync) folderToZip(excelsDir, zipFilePath string) error {
@ -534,10 +535,6 @@ func (e *ExportAsync) processTimeShard(ctx context.Context, tempDir string, work
 			// 如果本次获取的数据不足limit，说明这个时间段的数据已经取完
 			currentTime = queryEndTime
 		} else {
-			// 如果数据量等于limit，可能还有更多数据
-			// 这里可以根据业务逻辑决定是否移动时间
-			// 例如：如果数据是按时间排序的，可以取最后一条数据的时间作为下一次查询的起始时间
-			// 为了简化，我们还是按固定时间片移动
 			currentTime = queryEndTime
 		}

@ -639,12 +636,10 @@ func (e *ExportAsync) CheckAndIncrementTaskCount(ctx context.Context, key string
 	if err != nil {
 		return fmt.Errorf("获取%s数量失败: %w", limitType, err)
 	}
-
 	if count >= limit {
 		return fmt.Errorf("%s %s数量已达上限（%d），请稍后重试", e.fileName, limitType, limit)
 	}
-
-	if _err := e.taskSaveTool.Set(ctx, key, strconv.Itoa(count+1), 0).Err(); _err != nil {
+	if _err := e.taskSaveTool.Set(ctx, key, strconv.Itoa(count+1), 10*time.Minute).Err(); _err != nil {
 		e.taskSaveTool.Del(ctx, key)
 		return fmt.Errorf("更新任务数量失败: %w", err)
 	}
@ -653,9 +648,13 @@ func (e *ExportAsync) CheckAndIncrementTaskCount(ctx context.Context, key string

 func (e *ExportAsync) getAndParseTaskCount(ctx context.Context, key string) (int, error) {
 	res := e.taskSaveTool.Get(ctx, key)
-	if res.Val() == "" {
+	if errors.Is(res.Err(), redis.Nil) {
 		return 0, nil
 	}
+	if res.Err() != nil {
+		return 0, fmt.Errorf("获取任务数量失败: %w", res.Err())
+	}
+
 	count, err := strconv.Atoi(res.Val())
 	if err != nil {
 		return 0, fmt.Errorf("解析任务数量失败: %w", err)
@ -685,7 +684,6 @@ func (e *ExportAsync) updateTask(ctx context.Context) (err error) {
 }

 func (e *ExportAsync) processAdd(ctx context.Context, addNum int32) {
-
 	atomic.AddInt32(&e.task.Process, addNum)
 	e.logTool.Infof("异步导出任务：%s,当前进度：%d", e.task.Id, e.task.Process)
 	_ = e.updateTask(ctx)
@ -763,7 +761,7 @@ func (e *ExportAsync) release() {
 	e.batchSize = DefaultBatch
 	e.maxRowPerFile = DefaultMaxRowPerFile
 	e.csvToExcelBatch = DefaultCsvToExcelBatch
-	e.task = nil
+	e.task = &Task{}
 	e.workerNum = DefaultWorkNum
 	e.uploader = DefaultUploader
 	e.logTool = NewLogPrint(nil)
--- a/merge.go
+++ b/merge.go
@ -3,12 +3,11 @@ package l_export_async
 import (
 	"encoding/csv"
 	"fmt"
+	"github.com/xuri/excelize/v2"
 	"io"
 	"math"
 	"os"
 	"regexp"
-
-	"github.com/xuri/excelize/v2"
 )

 type (
--- a/redis.go
+++ b/redis.go
@ -16,7 +16,7 @@ func (r *redisTaskStore) Set(ctx context.Context, key string, value interface{},
 }

 func (r *redisTaskStore) Del(ctx context.Context, keys ...string) TaskErr {
-	//实际运行中并没有去执行这个，因为不确定是否真的需要删除，如果需要可以自行写入
+
 	return r.client.Del(ctx, keys...)
 }

--- a/util/logger.go
+++ b/util/logger.go
@ -0,0 +1,15 @@
+package util
+
+type Logger interface {
+	// Debugf logs a formatted debugging message.
+	Debugf(format string, args ...interface{})
+
+	// Infof logs a formatted informational message.
+	Infof(format string, args ...interface{})
+
+	// Warnf logs a formatted warning message.
+	Warnf(format string, args ...interface{})
+
+	// Errorf logs a formatted error message.
+	Errorf(format string, args ...interface{})
+}