You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

cache.go 16 kB

8 months ago
8 months ago
8 months ago
8 months ago
8 months ago
8 months ago
8 months ago
8 months ago
8 months ago
8 months ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665
  1. package cache
  2. import (
  3. "errors"
  4. "io"
  5. "os"
  6. "path/filepath"
  7. "sync"
  8. "syscall"
  9. "time"
  10. "github.com/inhies/go-bytesize"
  11. "github.com/samber/lo"
  12. "gitlink.org.cn/cloudream/common/pkgs/logger"
  13. "gitlink.org.cn/cloudream/common/pkgs/trie"
  14. cdssdk "gitlink.org.cn/cloudream/common/sdks/storage"
  15. "gitlink.org.cn/cloudream/common/utils/io2"
  16. "gitlink.org.cn/cloudream/common/utils/lo2"
  17. "gitlink.org.cn/cloudream/storage2/client2/internal/mount/config"
  18. "gitlink.org.cn/cloudream/storage2/client2/internal/mount/fuse"
  19. "gitlink.org.cn/cloudream/storage2/common/pkgs/db2"
  20. "gitlink.org.cn/cloudream/storage2/common/pkgs/downloader"
  21. "gitlink.org.cn/cloudream/storage2/common/pkgs/uploader"
  22. )
  23. type CacheEntry interface {
  24. fuse.FsEntry
  25. // 在虚拟文件系统中的路径,即不包含缓存目录的路径
  26. PathComps() []string
  27. }
  28. type CacheEntryInfo struct {
  29. PathComps []string
  30. Size int64
  31. Mode os.FileMode
  32. ModTime time.Time
  33. IsDir bool
  34. }
  35. type Cache struct {
  36. cfg *config.Config
  37. db *db2.DB
  38. uploader *uploader.Uploader
  39. downloader *downloader.Downloader
  40. cacheDataDir string
  41. cacheMetaDir string
  42. lock *sync.RWMutex
  43. cacheDone chan any
  44. activeCache *trie.Trie[*CacheFile]
  45. }
  46. func NewCache(cfg *config.Config, db *db2.DB, uploader *uploader.Uploader, downloader *downloader.Downloader) *Cache {
  47. return &Cache{
  48. cfg: cfg,
  49. db: db,
  50. uploader: uploader,
  51. downloader: downloader,
  52. cacheDataDir: filepath.Join(cfg.CacheDir, "data"),
  53. cacheMetaDir: filepath.Join(cfg.CacheDir, "meta"),
  54. lock: &sync.RWMutex{},
  55. cacheDone: make(chan any),
  56. activeCache: trie.NewTrie[*CacheFile](),
  57. }
  58. }
  59. func (c *Cache) Start() {
  60. go c.scanningCache()
  61. }
  62. func (c *Cache) Stop() {
  63. close(c.cacheDone)
  64. }
  65. func (c *Cache) GetCacheDataPath(comps ...string) string {
  66. comps2 := make([]string, len(comps)+1)
  67. comps2[0] = c.cacheDataDir
  68. copy(comps2[1:], comps)
  69. return filepath.Join(comps2...)
  70. }
  71. func (c *Cache) GetCacheDataPathComps(comps ...string) []string {
  72. comps2 := make([]string, len(comps)+1)
  73. comps2[0] = c.cacheDataDir
  74. copy(comps2[1:], comps)
  75. return comps2
  76. }
  77. func (c *Cache) GetCacheMetaPath(comps ...string) string {
  78. comps2 := make([]string, len(comps)+1)
  79. comps2[0] = c.cacheMetaDir
  80. copy(comps2[1:], comps)
  81. return filepath.Join(comps2...)
  82. }
  83. func (c *Cache) GetCacheMetaPathComps(comps ...string) []string {
  84. comps2 := make([]string, len(comps)+1)
  85. comps2[0] = c.cacheMetaDir
  86. copy(comps2[1:], comps)
  87. return comps2
  88. }
  89. // 获取指定位置的缓存条目信息。如果路径不存在,则返回nil。
  90. func (c *Cache) Stat(pathComps []string) *CacheEntryInfo {
  91. c.lock.RLock()
  92. defer c.lock.RUnlock()
  93. node, ok := c.activeCache.WalkEnd(pathComps)
  94. if ok && node.Value != nil {
  95. info := node.Value.Info()
  96. return &info
  97. }
  98. metaPath := c.GetCacheMetaPath(pathComps...)
  99. stat, err := os.Stat(metaPath)
  100. if err != nil {
  101. // TODO 日志记录
  102. return nil
  103. }
  104. if stat.IsDir() {
  105. info, err := loadCacheDirInfo(c, pathComps)
  106. if err != nil {
  107. return nil
  108. }
  109. return info
  110. }
  111. info, err := loadCacheFileInfo(c, pathComps)
  112. if err != nil {
  113. return nil
  114. }
  115. return info
  116. }
  117. // 创建一个缓存文件。如果文件已经存在,则会覆盖已有文件。如果加载过程中发生了错误,或者目标位置是一个目录,则会返回nil。
  118. func (c *Cache) CreateFile(pathComps []string) *CacheFile {
  119. c.lock.Lock()
  120. defer c.lock.Unlock()
  121. node, ok := c.activeCache.WalkEnd(pathComps)
  122. if ok && node.Value != nil {
  123. node.Value.Delete()
  124. if node.Value.state.uploading != nil {
  125. node.Value.state.uploading.isDeleted = true
  126. }
  127. }
  128. ch, err := createNewCacheFile(c, pathComps)
  129. if err != nil {
  130. logger.Warnf("create new cache file %v: %v", pathComps, err)
  131. return nil
  132. }
  133. ch.state.refCount++
  134. c.activeCache.CreateWords(pathComps).Value = ch
  135. logger.Debugf("create new cache file %v", pathComps)
  136. return ch
  137. }
  138. // 尝试加载缓存文件,如果文件不存在,则使用obj的信息创建一个新缓存文件,而如果obj为nil,那么会返回nil。
  139. func (c *Cache) LoadFile(pathComps []string, obj *cdssdk.Object) *CacheFile {
  140. c.lock.Lock()
  141. defer c.lock.Unlock()
  142. node, ok := c.activeCache.WalkEnd(pathComps)
  143. if ok && node.Value != nil {
  144. if !node.Value.state.isLoaded {
  145. err := node.Value.Load()
  146. if err != nil {
  147. logger.Warnf("load cache %v: %v", pathComps, err)
  148. return nil
  149. }
  150. }
  151. return node.Value
  152. }
  153. ch, err := loadCacheFile(c, pathComps)
  154. if err == nil {
  155. ch.remoteObj = obj
  156. ch.state.refCount++
  157. c.activeCache.CreateWords(pathComps).Value = ch
  158. logger.Debugf("load cache %v", pathComps)
  159. return ch
  160. }
  161. if !os.IsNotExist(err) {
  162. // TODO 日志记录
  163. logger.Warnf("load cache %v: %v", pathComps, err)
  164. return nil
  165. }
  166. if obj == nil {
  167. return nil
  168. }
  169. ch, err = newCacheFileFromObject(c, pathComps, obj)
  170. if err != nil {
  171. logger.Warnf("create cache %v from object: %v", pathComps, err)
  172. return nil
  173. }
  174. ch.state.refCount++
  175. c.activeCache.CreateWords(pathComps).Value = ch
  176. logger.Debugf("create cache %v from object %v", pathComps, obj.ObjectID)
  177. return ch
  178. }
  179. // 创建一个缓存目录。如果目录已经存在,则会重置目录属性。如果加载过程中发生了错误,或者目标位置是一个文件,则会返回nil
  180. func (c *Cache) CreateDir(pathComps []string) *CacheDir {
  181. c.lock.Lock()
  182. defer c.lock.Unlock()
  183. ch, err := createNewCacheDir(c, pathComps)
  184. if err != nil {
  185. logger.Warnf("create cache dir: %v", err)
  186. return nil
  187. }
  188. return ch
  189. }
  190. type CreateDirOption struct {
  191. ModTime time.Time
  192. }
  193. // 加载指定缓存目录,如果目录不存在,则使用createOpt选项创建目录,而如果createOpt为nil,那么会返回nil。
  194. func (c *Cache) LoadDir(pathComps []string, createOpt *CreateDirOption) *CacheDir {
  195. c.lock.Lock()
  196. defer c.lock.Unlock()
  197. ch, err := loadCacheDir(c, pathComps)
  198. if err == nil {
  199. return ch
  200. }
  201. if !os.IsNotExist(err) {
  202. // TODO 日志记录
  203. return nil
  204. }
  205. if createOpt == nil {
  206. return nil
  207. }
  208. // 创建目录
  209. ch, err = makeCacheDirFromOption(c, pathComps, *createOpt)
  210. if err != nil {
  211. // TODO 日志记录
  212. return nil
  213. }
  214. return ch
  215. }
  216. // 加载指定路径下的所有缓存条目信息
  217. func (c *Cache) StatMany(pathComps []string) []CacheEntryInfo {
  218. c.lock.RLock()
  219. defer c.lock.RUnlock()
  220. var infos []CacheEntryInfo
  221. exists := make(map[string]bool)
  222. node, ok := c.activeCache.WalkEnd(pathComps)
  223. if ok {
  224. for name, child := range node.WordNexts {
  225. if child.Value != nil {
  226. infos = append(infos, child.Value.Info())
  227. exists[name] = true
  228. }
  229. }
  230. }
  231. osEns, err := os.ReadDir(c.GetCacheMetaPath(pathComps...))
  232. if err != nil {
  233. return nil
  234. }
  235. for _, e := range osEns {
  236. if exists[e.Name()] {
  237. continue
  238. }
  239. if e.IsDir() {
  240. info, err := loadCacheDirInfo(c, append(lo2.ArrayClone(pathComps), e.Name()))
  241. if err != nil {
  242. continue
  243. }
  244. infos = append(infos, *info)
  245. } else {
  246. info, err := loadCacheFileInfo(c, append(lo2.ArrayClone(pathComps), e.Name()))
  247. if err != nil {
  248. continue
  249. }
  250. infos = append(infos, *info)
  251. }
  252. }
  253. return infos
  254. }
  255. // 删除指定路径的缓存文件或目录。删除目录时如果目录不为空,则会报错。
  256. func (c *Cache) Remove(pathComps []string) error {
  257. c.lock.Lock()
  258. defer c.lock.Unlock()
  259. node, ok := c.activeCache.WalkEnd(pathComps)
  260. if ok {
  261. if len(node.WordNexts) > 0 {
  262. return fuse.ErrNotEmpty
  263. }
  264. if node.Value != nil {
  265. node.Value.Delete()
  266. if node.Value.state.uploading != nil {
  267. node.Value.state.uploading.isDeleted = true
  268. }
  269. }
  270. node.RemoveSelf(true)
  271. logger.Debugf("active cache %v removed", pathComps)
  272. return nil
  273. }
  274. metaPath := c.GetCacheMetaPath(pathComps...)
  275. err := os.Remove(metaPath)
  276. if err == nil || os.IsNotExist(err) {
  277. logger.Debugf("local cache %v removed", pathComps)
  278. return nil
  279. }
  280. if errors.Is(err, syscall.ENOTEMPTY) {
  281. return fuse.ErrNotEmpty
  282. }
  283. return err
  284. }
  285. // 移动指定路径的缓存文件或目录到新的路径。如果目标路径已经存在,则会报错。
  286. //
  287. // 如果移动成功,则返回移动后的缓存文件或目录。如果文件或目录不存在,则返回nil。
  288. func (c *Cache) Move(pathComps []string, newPathComps []string) error {
  289. c.lock.Lock()
  290. defer c.lock.Unlock()
  291. _, ok := c.activeCache.WalkEnd(newPathComps)
  292. if ok {
  293. return fuse.ErrExists
  294. }
  295. newMetaPath := c.GetCacheMetaPath(newPathComps...)
  296. newDataPath := c.GetCacheDataPath(newPathComps...)
  297. _, err := os.Stat(newMetaPath)
  298. if err == nil {
  299. return fuse.ErrExists
  300. } else if !os.IsNotExist(err) {
  301. return err
  302. }
  303. metaPath := c.GetCacheMetaPath(pathComps...)
  304. dataPath := c.GetCacheDataPath(pathComps...)
  305. // 每个缓存文件持有meta文件和data文件的句柄,所以这里移动文件,不影响句柄的使用。
  306. // 只能忽略这里的错误
  307. os.Rename(metaPath, newMetaPath)
  308. os.Rename(dataPath, newDataPath)
  309. // 更新缓存
  310. oldNode, ok := c.activeCache.WalkEnd(pathComps)
  311. if ok {
  312. newNode := c.activeCache.CreateWords(newPathComps)
  313. newNode.Value = oldNode.Value
  314. newNode.WordNexts = oldNode.WordNexts
  315. oldNode.RemoveSelf(false)
  316. if newNode.Value != nil {
  317. newNode.Value.Move(newPathComps)
  318. }
  319. newNode.Iterate(func(path []string, node *trie.Node[*CacheFile], isWordNode bool) trie.VisitCtrl {
  320. if node.Value != nil {
  321. node.Value.Move(lo2.AppendNew(newPathComps, path...))
  322. }
  323. return trie.VisitContinue
  324. })
  325. }
  326. logger.Debugf("cache moved: %v -> %v", pathComps, newPathComps)
  327. return nil
  328. }
  329. type uploadingPackage struct {
  330. bktName string
  331. pkgName string
  332. pkg cdssdk.Package
  333. upObjs []*uploadingObject
  334. }
  335. type uploadingObject struct {
  336. pathComps []string
  337. cache *CacheFile
  338. reader *CacheFileHandle
  339. isDeleted bool
  340. isSuccess bool
  341. }
  342. func (c *Cache) scanningCache() {
  343. ticker := time.NewTicker(time.Second * 5)
  344. defer ticker.Stop()
  345. lastScanPath := []string{}
  346. for {
  347. select {
  348. case _, ok := <-c.cacheDone:
  349. if !ok {
  350. return
  351. }
  352. case <-ticker.C:
  353. }
  354. c.lock.Lock()
  355. type packageFullName struct {
  356. bktName string
  357. pkgName string
  358. }
  359. uploadingPkgs := make(map[packageFullName]*uploadingPackage)
  360. visitCnt := 0
  361. visitBreak := false
  362. node, _ := c.activeCache.WalkEnd(lastScanPath)
  363. node.Iterate(func(path []string, node *trie.Node[*CacheFile], isWordNode bool) trie.VisitCtrl {
  364. ch := node.Value
  365. if ch == nil {
  366. return trie.VisitContinue
  367. }
  368. if ch.state.refCount > 0 {
  369. logger.Debugf("skip cache %v, refCount: %v", path, ch.state.refCount)
  370. return trie.VisitContinue
  371. }
  372. visitCnt++
  373. if ch.Revision() > 0 {
  374. // 1. 本地缓存被修改了,如果一段时间内没有被使用,则进行上传
  375. // 不存放在Package里的文件,不需要上传
  376. if len(ch.pathComps) <= 2 {
  377. return trie.VisitContinue
  378. }
  379. if time.Since(ch.state.freeTime) > c.cfg.UploadPendingTime && ch.state.uploading == nil {
  380. fullName := packageFullName{ch.pathComps[0], ch.pathComps[1]}
  381. pkg, ok := uploadingPkgs[fullName]
  382. if !ok {
  383. pkg = &uploadingPackage{
  384. bktName: ch.pathComps[0],
  385. pkgName: ch.pathComps[1],
  386. }
  387. uploadingPkgs[fullName] = pkg
  388. }
  389. obj := &uploadingObject{
  390. pathComps: lo2.ArrayClone(ch.pathComps),
  391. cache: ch,
  392. reader: ch.OpenReadWhenScanning(),
  393. }
  394. pkg.upObjs = append(pkg.upObjs, obj)
  395. ch.state.uploading = obj
  396. }
  397. } else if ch.state.isLoaded {
  398. // 2. 本地缓存没有被修改,如果一段时间内没有被使用,则进行卸载
  399. if time.Since(ch.state.freeTime) > c.cfg.CacheActiveTime {
  400. ch.Unload()
  401. ch.state.isLoaded = false
  402. ch.state.unloadTime = time.Now()
  403. }
  404. } else {
  405. // 3. 卸载后的缓存,如果一段时间内没有被使用,则进行删除。
  406. // 能达到这个阶段,则肯定已经被同步到远端了
  407. if time.Since(ch.state.unloadTime) > c.cfg.CacheExpireTime {
  408. ch.Delete()
  409. node.RemoveSelf(true)
  410. }
  411. }
  412. // 每次最多遍历500个节点,防止占用锁太久
  413. if visitCnt > 500 {
  414. lastScanPath = lo2.ArrayClone(path)
  415. visitBreak = true
  416. return trie.VisitBreak
  417. }
  418. return trie.VisitContinue
  419. })
  420. if !visitBreak {
  421. lastScanPath = []string{}
  422. }
  423. c.lock.Unlock()
  424. if len(uploadingPkgs) > 0 {
  425. go c.doUploading(lo.Values(uploadingPkgs))
  426. }
  427. }
  428. }
  429. func (c *Cache) doUploading(pkgs []*uploadingPackage) {
  430. /// 1. 先查询每个Package的信息,如果不存在,则暂时不上传
  431. var sucPkgs []*uploadingPackage
  432. var failedPkgs []*uploadingPackage
  433. for _, pkg := range pkgs {
  434. // TODO 用户ID
  435. p, err := c.db.Package().GetUserPackageByName(c.db.DefCtx(), 1, pkg.bktName, pkg.pkgName)
  436. if err != nil {
  437. logger.Warnf("get user package %v/%v: %v", pkg.bktName, pkg.pkgName, err)
  438. failedPkgs = append(failedPkgs, pkg)
  439. continue
  440. }
  441. pkg.pkg = p
  442. sucPkgs = append(sucPkgs, pkg)
  443. }
  444. /// 2. 对于查询失败的Package,直接关闭文件,不进行上传
  445. // 在锁的保护下取消上传状态
  446. c.lock.Lock()
  447. for _, pkg := range failedPkgs {
  448. for _, obj := range pkg.upObjs {
  449. obj.cache.state.uploading = nil
  450. }
  451. }
  452. c.lock.Unlock()
  453. // 关闭文件必须在锁外
  454. for _, pkg := range failedPkgs {
  455. for _, obj := range pkg.upObjs {
  456. obj.reader.Close()
  457. }
  458. }
  459. /// 3. 开始上传每个Package
  460. for _, p := range sucPkgs {
  461. uploader, err := c.uploader.BeginUpdate(1, p.pkg.PackageID, 0, nil, nil)
  462. if err != nil {
  463. logger.Warnf("begin update package %v/%v: %v", p.bktName, p.pkgName, err)
  464. continue
  465. }
  466. upSuc := 0
  467. upSucAmt := int64(0)
  468. upFailed := 0
  469. upStartTime := time.Now()
  470. logger.Infof("begin uploading %v objects to package %v/%v", len(p.upObjs), p.bktName, p.pkgName)
  471. for _, o := range p.upObjs {
  472. rd := cacheFileReader{
  473. rw: o.reader,
  474. }
  475. counter := io2.Counter(&rd)
  476. err = uploader.Upload(cdssdk.JoinObjectPath(o.pathComps[2:]...), counter)
  477. if err != nil {
  478. logger.Warnf("upload object %v: %v", o.pathComps, err)
  479. upFailed++
  480. continue
  481. }
  482. o.isSuccess = true
  483. upSuc++
  484. upSucAmt += counter.Count()
  485. }
  486. // 在锁保护下登记上传结果
  487. c.lock.Lock()
  488. upCancel := 0
  489. upRename := 0
  490. // 检查是否有文件在上传期间发生了变化
  491. var sucObjs []*uploadingObject
  492. for _, o := range p.upObjs {
  493. o.cache.state.uploading = nil
  494. if !o.isSuccess {
  495. continue
  496. }
  497. oldPath := cdssdk.JoinObjectPath(o.pathComps[2:]...)
  498. newPath := cdssdk.JoinObjectPath(o.cache.pathComps[2:]...)
  499. if o.isDeleted {
  500. uploader.CancelObject(oldPath)
  501. upCancel++
  502. continue
  503. }
  504. // 如果对象移动到了另一个Package,那么也要取消上传
  505. if !lo2.ArrayEquals(o.pathComps[:2], o.cache.pathComps[:2]) {
  506. uploader.CancelObject(oldPath)
  507. upCancel++
  508. continue
  509. }
  510. // 只有仍在同Package内移动的对象才能直接重命名
  511. if newPath != oldPath {
  512. uploader.RenameObject(oldPath, newPath)
  513. upRename++
  514. }
  515. sucObjs = append(sucObjs, o)
  516. }
  517. _, err = uploader.Commit()
  518. if err != nil {
  519. logger.Warnf("commit update package %v/%v: %v", p.bktName, p.pkgName, err)
  520. } else {
  521. for _, obj := range sucObjs {
  522. obj.cache.RevisionUploaded(obj.reader.revision)
  523. }
  524. upTime := time.Since(upStartTime)
  525. logger.Infof("upload package %v/%v in %v, upload: %v, size: %v, speed: %v/s, cancel: %v, rename: %v",
  526. p.bktName, p.pkgName, upTime, upSuc, upSucAmt, bytesize.New(float64(upSucAmt)/upTime.Seconds()), upCancel, upRename)
  527. }
  528. c.lock.Unlock()
  529. // 在Cache锁以外关闭文件。
  530. // 关闭文件会影响refCount,所以无论是上传失败还是上传成功,都会在等待一段时间后才进行下一阶段的操作
  531. for _, obj := range p.upObjs {
  532. obj.reader.Close()
  533. }
  534. }
  535. }
  536. type cacheFileReader struct {
  537. rw *CacheFileHandle
  538. pos int64
  539. }
  540. func (r *cacheFileReader) Read(p []byte) (int, error) {
  541. n, err := r.rw.ReadAt(p, r.pos)
  542. r.pos += int64(n)
  543. if err != nil {
  544. return n, err
  545. }
  546. if n != len(p) {
  547. return n, io.EOF
  548. }
  549. return n, nil
  550. }

本项目旨在将云际存储公共基础设施化,使个人及企业可低门槛使用高效的云际存储服务(安装开箱即用云际存储客户端即可,无需关注其他组件的部署),同时支持用户灵活便捷定制云际存储的功能细节。