mirror of
https://github.com/tickstep/aliyunpan.git
synced 2025-01-24 06:52:16 +08:00
487 lines
12 KiB
Go
487 lines
12 KiB
Go
package syncdrive
|
||
|
||
import (
|
||
"context"
|
||
"fmt"
|
||
"github.com/tickstep/aliyunpan-api/aliyunpan"
|
||
"github.com/tickstep/aliyunpan/internal/utils"
|
||
"github.com/tickstep/aliyunpan/internal/waitgroup"
|
||
"github.com/tickstep/aliyunpan/library/collection"
|
||
"github.com/tickstep/library-go/logger"
|
||
"io/ioutil"
|
||
"os"
|
||
"path"
|
||
"strings"
|
||
"time"
|
||
)
|
||
|
||
type (
|
||
SyncMode string
|
||
|
||
// SyncTask 同步任务
|
||
SyncTask struct {
|
||
// Name 任务名称
|
||
Name string `json:"name"`
|
||
// Id 任务ID
|
||
Id string `json:"id"`
|
||
// DriveId 网盘ID,目前支持文件网盘
|
||
DriveId string `json:"-"`
|
||
// LocalFolderPath 本地目录
|
||
LocalFolderPath string `json:"localFolderPath"`
|
||
// PanFolderPath 云盘目录
|
||
PanFolderPath string `json:"panFolderPath"`
|
||
// Mode 同步模式
|
||
Mode SyncMode `json:"mode"`
|
||
// LastSyncTime 上一次同步时间
|
||
LastSyncTime string `json:"lastSyncTime"`
|
||
|
||
syncDbFolderPath string
|
||
localFileDb LocalSyncDb
|
||
panFileDb PanSyncDb
|
||
syncFileDb SyncFileDb
|
||
|
||
wg *waitgroup.WaitGroup
|
||
ctx context.Context
|
||
cancelFunc context.CancelFunc
|
||
|
||
panClient *aliyunpan.PanClient
|
||
|
||
fileDownloadParallel int
|
||
fileUploadParallel int
|
||
fileDownloadBlockSize int64
|
||
fileUploadBlockSize int64
|
||
useInternalUrl bool
|
||
|
||
fileActionTaskManager *FileActionTaskManager
|
||
}
|
||
)
|
||
|
||
const (
|
||
// UploadOnly 单向上传,即备份本地文件到云盘
|
||
UploadOnly SyncMode = "upload"
|
||
// DownloadOnly 只下载,即备份云盘文件到本地
|
||
DownloadOnly SyncMode = "download"
|
||
// SyncTwoWay 双向同步,本地和云盘文件完全保持一致
|
||
SyncTwoWay SyncMode = "sync"
|
||
)
|
||
|
||
func (t *SyncTask) NameLabel() string {
|
||
return t.Name + "(" + t.Id + ")"
|
||
}
|
||
|
||
func (t *SyncTask) String() string {
|
||
builder := &strings.Builder{}
|
||
builder.WriteString("任务: " + t.NameLabel() + "\n")
|
||
mode := "双向备份"
|
||
if t.Mode == UploadOnly {
|
||
mode = "备份本地文件(只上传)"
|
||
}
|
||
if t.Mode == DownloadOnly {
|
||
mode = "备份云盘文件(只下载)"
|
||
}
|
||
builder.WriteString("同步模式: " + mode + "\n")
|
||
builder.WriteString("本地目录: " + t.LocalFolderPath + "\n")
|
||
builder.WriteString("云盘目录: " + t.PanFolderPath + "\n")
|
||
return builder.String()
|
||
}
|
||
|
||
func (t *SyncTask) setupDb() error {
|
||
t.localFileDb = NewLocalSyncDb(t.localSyncDbFullPath())
|
||
t.panFileDb = NewPanSyncDb(t.panSyncDbFullPath())
|
||
t.syncFileDb = NewSyncFileDb(t.syncFileDbFullPath())
|
||
if _, e := t.localFileDb.Open(); e != nil {
|
||
return e
|
||
}
|
||
if _, e := t.panFileDb.Open(); e != nil {
|
||
return e
|
||
}
|
||
if _, e := t.syncFileDb.Open(); e != nil {
|
||
return e
|
||
}
|
||
return nil
|
||
}
|
||
|
||
// Start 启动同步任务
|
||
// 扫描本地和云盘文件信息并存储到本地数据库
|
||
func (t *SyncTask) Start() error {
|
||
if t.ctx != nil {
|
||
return fmt.Errorf("task have starting")
|
||
}
|
||
t.setupDb()
|
||
|
||
if t.fileActionTaskManager == nil {
|
||
t.fileActionTaskManager = NewFileActionTaskManager(t)
|
||
}
|
||
|
||
t.wg = waitgroup.NewWaitGroup(0)
|
||
|
||
var cancel context.CancelFunc
|
||
t.ctx, cancel = context.WithCancel(context.Background())
|
||
t.cancelFunc = cancel
|
||
|
||
go t.scanLocalFile(t.ctx)
|
||
go t.scanPanFile(t.ctx)
|
||
|
||
// start file sync manager
|
||
if e := t.fileActionTaskManager.Start(); e != nil {
|
||
return e
|
||
}
|
||
return nil
|
||
}
|
||
|
||
// Stop 停止同步任务
|
||
func (t *SyncTask) Stop() error {
|
||
if t.ctx == nil {
|
||
return nil
|
||
}
|
||
// cancel all sub task & process
|
||
t.cancelFunc()
|
||
|
||
// wait for finished
|
||
t.wg.Wait()
|
||
|
||
t.ctx = nil
|
||
t.cancelFunc = nil
|
||
|
||
// stop file action task (block routine)
|
||
t.fileActionTaskManager.Stop()
|
||
|
||
// release resources
|
||
if t.localFileDb != nil {
|
||
t.localFileDb.Close()
|
||
}
|
||
if t.panFileDb != nil {
|
||
t.panFileDb.Close()
|
||
}
|
||
if t.syncFileDb != nil {
|
||
t.syncFileDb.Close()
|
||
}
|
||
|
||
// record the sync time
|
||
t.LastSyncTime = utils.NowTimeStr()
|
||
return nil
|
||
}
|
||
|
||
// panSyncDbFullPath 云盘文件数据库
|
||
func (t *SyncTask) panSyncDbFullPath() string {
|
||
dir := path.Join(t.syncDbFolderPath, t.Id)
|
||
if b, _ := utils.PathExists(dir); !b {
|
||
os.MkdirAll(dir, 0600)
|
||
}
|
||
return path.Join(dir, "pan.bolt")
|
||
}
|
||
|
||
// localSyncDbFullPath 本地文件数据库
|
||
func (t *SyncTask) localSyncDbFullPath() string {
|
||
dir := path.Join(t.syncDbFolderPath, t.Id)
|
||
if b, _ := utils.PathExists(dir); !b {
|
||
os.MkdirAll(dir, 0600)
|
||
}
|
||
return path.Join(dir, "local.bolt")
|
||
}
|
||
|
||
// syncFileDbFullPath 同步文件过程数据库
|
||
func (t *SyncTask) syncFileDbFullPath() string {
|
||
dir := path.Join(t.syncDbFolderPath, t.Id)
|
||
if b, _ := utils.PathExists(dir); !b {
|
||
os.MkdirAll(dir, 0600)
|
||
}
|
||
return path.Join(dir, "sync.bolt")
|
||
}
|
||
|
||
func newLocalFileItem(file os.FileInfo, fullPath string) *LocalFileItem {
|
||
ft := "file"
|
||
if file.IsDir() {
|
||
ft = "folder"
|
||
}
|
||
return &LocalFileItem{
|
||
FileName: file.Name(),
|
||
FileSize: file.Size(),
|
||
FileType: ft,
|
||
CreatedAt: file.ModTime().Format("2006-01-02 15:04:05"),
|
||
UpdatedAt: file.ModTime().Format("2006-01-02 15:04:05"),
|
||
FileExtension: path.Ext(file.Name()),
|
||
Sha1Hash: "",
|
||
Path: fullPath,
|
||
ScanTimeAt: utils.NowTimeStr(),
|
||
ScanStatus: ScanStatusNormal,
|
||
}
|
||
}
|
||
|
||
// discardLocalFileDb 清理本地数据库中无效的数据项
|
||
func (t *SyncTask) discardLocalFileDb(filePath string, startTimeUnix int64) {
|
||
files, e := t.localFileDb.GetFileList(filePath)
|
||
if e != nil {
|
||
return
|
||
}
|
||
for _, file := range files {
|
||
if file.ScanTimeAt == "" || file.ScanTimeUnix() < startTimeUnix {
|
||
// label file discard
|
||
file.ScanStatus = ScanStatusDiscard
|
||
t.localFileDb.Update(file)
|
||
} else {
|
||
if file.IsFolder() {
|
||
t.discardLocalFileDb(file.Path, startTimeUnix)
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
// scanLocalFile 本地文件循环扫描进程
|
||
func (t *SyncTask) scanLocalFile(ctx context.Context) {
|
||
type folderItem struct {
|
||
fileInfo os.FileInfo
|
||
path string
|
||
}
|
||
|
||
// init the root folders info
|
||
pathParts := strings.Split(strings.ReplaceAll(t.LocalFolderPath, "\\", "/"), "/")
|
||
fullPath := ""
|
||
for _, p := range pathParts {
|
||
if p == "" {
|
||
continue
|
||
}
|
||
if strings.Contains(p, ":") {
|
||
// windows volume label, e.g: C:/ D:/
|
||
fullPath += p
|
||
continue
|
||
}
|
||
fullPath += "/" + p
|
||
fi, err := os.Stat(fullPath)
|
||
if err != nil {
|
||
// may be permission deny
|
||
continue
|
||
}
|
||
t.localFileDb.Add(newLocalFileItem(fi, fullPath))
|
||
}
|
||
|
||
folderQueue := collection.NewFifoQueue()
|
||
rootFolder, err := os.Stat(t.LocalFolderPath)
|
||
if err != nil {
|
||
return
|
||
}
|
||
folderQueue.Push(&folderItem{
|
||
fileInfo: rootFolder,
|
||
path: t.LocalFolderPath,
|
||
})
|
||
startTimeOfThisLoop := time.Now().Unix()
|
||
delayTimeCount := int64(0)
|
||
|
||
t.wg.AddDelta()
|
||
defer t.wg.Done()
|
||
for {
|
||
select {
|
||
case <-ctx.Done():
|
||
// cancel routine & done
|
||
logger.Verboseln("local file routine done")
|
||
return
|
||
default:
|
||
// 采用广度优先遍历(BFS)进行文件遍历
|
||
if delayTimeCount > 0 {
|
||
time.Sleep(1 * time.Second)
|
||
delayTimeCount -= 1
|
||
continue
|
||
} else if delayTimeCount == 0 {
|
||
delayTimeCount -= 1
|
||
startTimeOfThisLoop = time.Now().Unix()
|
||
logger.Verboseln("do scan local file process at ", utils.NowTimeStr())
|
||
}
|
||
obj := folderQueue.Pop()
|
||
if obj == nil {
|
||
// label discard file from DB
|
||
t.discardLocalFileDb(t.LocalFolderPath, startTimeOfThisLoop)
|
||
|
||
// restart scan loop over again
|
||
folderQueue.Push(&folderItem{
|
||
fileInfo: rootFolder,
|
||
path: t.LocalFolderPath,
|
||
})
|
||
delayTimeCount = TimeSecondsOfOneMinute
|
||
continue
|
||
}
|
||
item := obj.(*folderItem)
|
||
files, err := ioutil.ReadDir(item.path)
|
||
if err != nil {
|
||
continue
|
||
}
|
||
if len(files) == 0 {
|
||
continue
|
||
}
|
||
localFileAppendList := LocalFileList{}
|
||
for _, file := range files {
|
||
if strings.HasSuffix(file.Name(), DownloadingFileSuffix) {
|
||
// 下载中文件,跳过
|
||
continue
|
||
}
|
||
|
||
localFile := newLocalFileItem(file, item.path+"/"+file.Name())
|
||
localFileInDb, _ := t.localFileDb.Get(localFile.Path)
|
||
if localFileInDb == nil {
|
||
// append
|
||
localFile.ScanTimeAt = utils.NowTimeStr()
|
||
localFileAppendList = append(localFileAppendList, localFile)
|
||
} else {
|
||
// update newest info into DB
|
||
if localFile.UpdateTimeUnix() > localFileInDb.UpdateTimeUnix() {
|
||
localFileInDb.Sha1Hash = ""
|
||
}
|
||
localFileInDb.UpdatedAt = localFile.UpdatedAt
|
||
localFileInDb.CreatedAt = localFile.CreatedAt
|
||
localFileInDb.FileSize = localFile.FileSize
|
||
localFileInDb.FileType = localFile.FileType
|
||
localFileInDb.ScanTimeAt = utils.NowTimeStr()
|
||
localFileInDb.ScanStatus = ScanStatusNormal
|
||
if _, er := t.localFileDb.Update(localFileInDb); er != nil {
|
||
logger.Verboseln("local db update error ", er)
|
||
}
|
||
}
|
||
|
||
// for next term scan
|
||
if file.IsDir() {
|
||
folderQueue.Push(&folderItem{
|
||
fileInfo: file,
|
||
path: item.path + "/" + file.Name(),
|
||
})
|
||
}
|
||
}
|
||
|
||
if len(localFileAppendList) > 0 {
|
||
//fmt.Println(utils.ObjectToJsonStr(localFileAppendList))
|
||
if _, er := t.localFileDb.AddFileList(localFileAppendList); er != nil {
|
||
logger.Verboseln("add files to local file db error {}", er)
|
||
}
|
||
}
|
||
time.Sleep(500 * time.Millisecond)
|
||
}
|
||
}
|
||
}
|
||
|
||
// discardPanFileDb 清理云盘数据库中无效的数据项
|
||
func (t *SyncTask) discardPanFileDb(filePath string, startTimeUnix int64) {
|
||
files, e := t.panFileDb.GetFileList(filePath)
|
||
if e != nil {
|
||
return
|
||
}
|
||
for _, file := range files {
|
||
if file.ScanTimeUnix() < startTimeUnix {
|
||
// label file discard
|
||
file.ScanStatus = ScanStatusDiscard
|
||
t.panFileDb.Update(file)
|
||
} else {
|
||
if file.IsFolder() {
|
||
t.discardPanFileDb(file.Path, startTimeUnix)
|
||
}
|
||
}
|
||
}
|
||
}
|
||
|
||
// scanPanFile 云盘文件循环扫描进程
|
||
func (t *SyncTask) scanPanFile(ctx context.Context) {
|
||
// init the root folders info
|
||
pathParts := strings.Split(strings.ReplaceAll(t.PanFolderPath, "\\", "/"), "/")
|
||
fullPath := ""
|
||
for _, p := range pathParts {
|
||
if p == "" {
|
||
continue
|
||
}
|
||
fullPath += "/" + p
|
||
fi, err := t.panClient.FileInfoByPath(t.DriveId, fullPath)
|
||
if err != nil {
|
||
return
|
||
}
|
||
pFile := NewPanFileItem(fi)
|
||
pFile.ScanTimeAt = utils.NowTimeStr()
|
||
t.panFileDb.Add(pFile)
|
||
time.Sleep(200 * time.Millisecond)
|
||
}
|
||
|
||
folderQueue := collection.NewFifoQueue()
|
||
rootPanFile, err := t.panClient.FileInfoByPath(t.DriveId, t.PanFolderPath)
|
||
if err != nil {
|
||
return
|
||
}
|
||
folderQueue.Push(rootPanFile)
|
||
startTimeOfThisLoop := time.Now().Unix()
|
||
delayTimeCount := int64(0)
|
||
|
||
t.wg.AddDelta()
|
||
defer t.wg.Done()
|
||
for {
|
||
select {
|
||
case <-ctx.Done():
|
||
// cancel routine & done
|
||
logger.Verboseln("pan file routine done")
|
||
return
|
||
default:
|
||
// 采用广度优先遍历(BFS)进行文件遍历
|
||
if delayTimeCount > 0 {
|
||
time.Sleep(1 * time.Second)
|
||
delayTimeCount -= 1
|
||
continue
|
||
} else if delayTimeCount == 0 {
|
||
delayTimeCount -= 1
|
||
startTimeOfThisLoop = time.Now().Unix()
|
||
logger.Verboseln("do scan pan file process at ", utils.NowTimeStr())
|
||
}
|
||
obj := folderQueue.Pop()
|
||
if obj == nil {
|
||
// label discard file from DB
|
||
t.discardPanFileDb(t.PanFolderPath, startTimeOfThisLoop)
|
||
|
||
// restart scan loop over again
|
||
folderQueue.Push(rootPanFile)
|
||
delayTimeCount = TimeSecondsOf5Minute
|
||
continue
|
||
}
|
||
item := obj.(*aliyunpan.FileEntity)
|
||
// TODO: check to decide to sync file info or to await
|
||
files, err := t.panClient.FileListGetAll(&aliyunpan.FileListParam{
|
||
DriveId: t.DriveId,
|
||
ParentFileId: item.FileId,
|
||
})
|
||
if err != nil {
|
||
// retry next term
|
||
folderQueue.Push(item)
|
||
time.Sleep(10 * time.Second)
|
||
continue
|
||
}
|
||
panFileList := PanFileList{}
|
||
for _, file := range files {
|
||
file.Path = path.Join(item.Path, file.FileName)
|
||
//fmt.Println(utils.ObjectToJsonStr(file, true))
|
||
panFileInDb, _ := t.panFileDb.Get(file.Path)
|
||
if panFileInDb == nil {
|
||
// append
|
||
pFile := NewPanFileItem(file)
|
||
pFile.ScanTimeAt = utils.NowTimeStr()
|
||
panFileList = append(panFileList, pFile)
|
||
} else {
|
||
// update newest info into DB
|
||
panFileInDb.DomainId = file.DomainId
|
||
panFileInDb.FileId = file.FileId
|
||
panFileInDb.FileType = file.FileType
|
||
panFileInDb.Category = file.Category
|
||
panFileInDb.Crc64Hash = file.Crc64Hash
|
||
panFileInDb.Sha1Hash = file.ContentHash
|
||
panFileInDb.FileSize = file.FileSize
|
||
panFileInDb.UpdatedAt = file.UpdatedAt
|
||
panFileInDb.CreatedAt = file.CreatedAt
|
||
panFileInDb.ScanTimeAt = utils.NowTimeStr()
|
||
panFileInDb.ScanStatus = ScanStatusNormal
|
||
t.panFileDb.Update(panFileInDb)
|
||
}
|
||
|
||
if file.IsFolder() {
|
||
folderQueue.Push(file)
|
||
}
|
||
}
|
||
if len(panFileList) > 0 {
|
||
if _, er := t.panFileDb.AddFileList(panFileList); er != nil {
|
||
logger.Verboseln("add files to pan file db error {}", er)
|
||
}
|
||
}
|
||
time.Sleep(10 * time.Second) // 延迟避免触发风控
|
||
}
|
||
}
|
||
}
|