You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

generator.go 14 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488
  1. package gen
  2. import (
  3. "fmt"
  4. "math"
  5. "gitlink.org.cn/cloudream/common/pkgs/ioswitch/dag"
  6. cdssdk "gitlink.org.cn/cloudream/common/sdks/storage"
  7. "gitlink.org.cn/cloudream/common/utils/lo2"
  8. "gitlink.org.cn/cloudream/common/utils/math2"
  9. "gitlink.org.cn/cloudream/storage/common/pkgs/ioswitch2"
  10. "gitlink.org.cn/cloudream/storage/common/pkgs/ioswitch2/ops2"
  11. "gitlink.org.cn/cloudream/storage/common/pkgs/ioswitch2/parser/state"
  12. "gitlink.org.cn/cloudream/storage/common/pkgs/storage/types"
  13. )
  14. // 检查使用不同编码时参数是否设置到位
  15. func CheckEncodingParams(ctx *state.GenerateState) error {
  16. for _, f := range ctx.Ft.Froms {
  17. if f.GetStreamIndex().IsEC() {
  18. ctx.UseEC = true
  19. if ctx.Ft.ECParam == nil {
  20. return fmt.Errorf("EC encoding parameters not set")
  21. }
  22. }
  23. if f.GetStreamIndex().IsSegment() {
  24. ctx.UseSegment = true
  25. if ctx.Ft.SegmentParam == nil {
  26. return fmt.Errorf("segment parameters not set")
  27. }
  28. }
  29. }
  30. for _, t := range ctx.Ft.Toes {
  31. if t.GetStreamIndex().IsEC() {
  32. ctx.UseEC = true
  33. if ctx.Ft.ECParam == nil {
  34. return fmt.Errorf("EC encoding parameters not set")
  35. }
  36. }
  37. if t.GetStreamIndex().IsSegment() {
  38. ctx.UseSegment = true
  39. if ctx.Ft.SegmentParam == nil {
  40. return fmt.Errorf("segment parameters not set")
  41. }
  42. }
  43. }
  44. return nil
  45. }
  46. // 计算输入流的打开范围。如果From或者To中包含EC的流,则会将打开范围扩大到条带大小的整数倍。
  47. func CalcStreamRange(ctx *state.GenerateState) {
  48. rng := math2.NewRange(math.MaxInt64, 0)
  49. for _, to := range ctx.Ft.Toes {
  50. strIdx := to.GetStreamIndex()
  51. if strIdx.IsRaw() {
  52. toRng := to.GetRange()
  53. rng.ExtendStart(toRng.Offset)
  54. if toRng.Length != nil {
  55. rng.ExtendEnd(toRng.Offset + *toRng.Length)
  56. } else {
  57. rng.Length = nil
  58. }
  59. } else if strIdx.IsEC() {
  60. toRng := to.GetRange()
  61. stripSize := ctx.Ft.ECParam.StripSize()
  62. blkStartIndex := math2.FloorDiv(toRng.Offset, int64(ctx.Ft.ECParam.ChunkSize))
  63. rng.ExtendStart(blkStartIndex * stripSize)
  64. if toRng.Length != nil {
  65. blkEndIndex := math2.CeilDiv(toRng.Offset+*toRng.Length, int64(ctx.Ft.ECParam.ChunkSize))
  66. rng.ExtendEnd(blkEndIndex * stripSize)
  67. } else {
  68. rng.Length = nil
  69. }
  70. } else if strIdx.IsSegment() {
  71. // Segment节点的Range是相对于本段的,需要加上本段的起始位置
  72. toRng := to.GetRange()
  73. segStart := ctx.Ft.SegmentParam.CalcSegmentStart(strIdx.Index)
  74. offset := toRng.Offset + segStart
  75. rng.ExtendStart(offset)
  76. if toRng.Length != nil {
  77. rng.ExtendEnd(offset + *toRng.Length)
  78. } else {
  79. rng.Length = nil
  80. }
  81. }
  82. }
  83. if ctx.UseEC {
  84. stripSize := ctx.Ft.ECParam.StripSize()
  85. rng.ExtendStart(math2.Floor(rng.Offset, stripSize))
  86. if rng.Length != nil {
  87. rng.ExtendEnd(math2.Ceil(rng.Offset+*rng.Length, stripSize))
  88. }
  89. }
  90. ctx.StreamRange = rng
  91. }
  92. func Extend(ctx *state.GenerateState) error {
  93. for _, fr := range ctx.Ft.Froms {
  94. frNode, err := buildFromNode(ctx, fr)
  95. if err != nil {
  96. return err
  97. }
  98. ctx.FromNodes[fr] = frNode
  99. ctx.IndexedStreams = append(ctx.IndexedStreams, state.IndexedStream{
  100. Stream: frNode.Output().Var(),
  101. StreamIndex: fr.GetStreamIndex(),
  102. })
  103. // 对于完整文件的From,生成Split指令
  104. if fr.GetStreamIndex().IsRaw() {
  105. // 只有输入输出需要EC编码的块时,才生成相关指令
  106. if ctx.UseEC {
  107. splitNode := ctx.DAG.NewChunkedSplit(ctx.Ft.ECParam.ChunkSize, ctx.Ft.ECParam.K)
  108. splitNode.Split(frNode.Output().Var())
  109. for i := 0; i < ctx.Ft.ECParam.K; i++ {
  110. ctx.IndexedStreams = append(ctx.IndexedStreams, state.IndexedStream{
  111. Stream: splitNode.SubStream(i),
  112. StreamIndex: ioswitch2.ECStream(i),
  113. })
  114. }
  115. }
  116. // 同上
  117. if ctx.UseSegment {
  118. splitNode := ctx.DAG.NewSegmentSplit(ctx.Ft.SegmentParam.Segments)
  119. frNode.Output().Var().ToSlot(splitNode.InputSlot())
  120. for i := 0; i < len(ctx.Ft.SegmentParam.Segments); i++ {
  121. ctx.IndexedStreams = append(ctx.IndexedStreams, state.IndexedStream{
  122. Stream: splitNode.Segment(i),
  123. StreamIndex: ioswitch2.SegmentStream(i),
  124. })
  125. }
  126. }
  127. }
  128. }
  129. if ctx.UseEC {
  130. // 如果有K个不同的文件块流,则生成Multiply指令,同时针对其生成的流,生成Join指令
  131. ecInputStrs := make(map[int]*dag.StreamVar)
  132. for _, s := range ctx.IndexedStreams {
  133. if s.StreamIndex.IsEC() && ecInputStrs[s.StreamIndex.Index] == nil {
  134. ecInputStrs[s.StreamIndex.Index] = s.Stream
  135. if len(ecInputStrs) == ctx.Ft.ECParam.K {
  136. break
  137. }
  138. }
  139. }
  140. if len(ecInputStrs) == ctx.Ft.ECParam.K {
  141. mulNode := ctx.DAG.NewECMultiply(*ctx.Ft.ECParam)
  142. for i, s := range ecInputStrs {
  143. mulNode.AddInput(s, i)
  144. }
  145. for i := 0; i < ctx.Ft.ECParam.N; i++ {
  146. ctx.IndexedStreams = append(ctx.IndexedStreams, state.IndexedStream{
  147. Stream: mulNode.NewOutput(i),
  148. StreamIndex: ioswitch2.ECStream(i),
  149. })
  150. }
  151. joinNode := ctx.DAG.NewChunkedJoin(ctx.Ft.ECParam.ChunkSize)
  152. for i := 0; i < ctx.Ft.ECParam.K; i++ {
  153. // 不可能找不到流
  154. joinNode.AddInput(findOutputStream(ctx, ioswitch2.ECStream(i)))
  155. }
  156. ctx.IndexedStreams = append(ctx.IndexedStreams, state.IndexedStream{
  157. Stream: joinNode.Joined(),
  158. StreamIndex: ioswitch2.RawStream(),
  159. })
  160. }
  161. }
  162. if ctx.UseSegment {
  163. // 先假设有所有的顺序分段,生成Join指令,后续根据Range再实际计算是否缺少流
  164. joinNode := ctx.DAG.NewSegmentJoin(ctx.Ft.SegmentParam.Segments)
  165. for i := 0; i < ctx.Ft.SegmentParam.SegmentCount(); i++ {
  166. str := findOutputStream(ctx, ioswitch2.SegmentStream(i))
  167. if str != nil {
  168. str.ToSlot(joinNode.InputSlot(i))
  169. }
  170. }
  171. ctx.IndexedStreams = append(ctx.IndexedStreams, state.IndexedStream{
  172. Stream: joinNode.Joined(),
  173. StreamIndex: ioswitch2.RawStream(),
  174. })
  175. // SegmentJoin生成的Join指令可以用来生成EC块
  176. if ctx.UseEC {
  177. splitNode := ctx.DAG.NewChunkedSplit(ctx.Ft.ECParam.ChunkSize, ctx.Ft.ECParam.K)
  178. splitNode.Split(joinNode.Joined())
  179. mulNode := ctx.DAG.NewECMultiply(*ctx.Ft.ECParam)
  180. for i := 0; i < ctx.Ft.ECParam.K; i++ {
  181. mulNode.AddInput(splitNode.SubStream(i), i)
  182. ctx.IndexedStreams = append(ctx.IndexedStreams, state.IndexedStream{
  183. Stream: splitNode.SubStream(i),
  184. StreamIndex: ioswitch2.ECStream(i),
  185. })
  186. }
  187. for i := 0; i < ctx.Ft.ECParam.N; i++ {
  188. ctx.IndexedStreams = append(ctx.IndexedStreams, state.IndexedStream{
  189. Stream: mulNode.NewOutput(i),
  190. StreamIndex: ioswitch2.ECStream(i),
  191. })
  192. }
  193. }
  194. }
  195. // 为每一个To找到一个输入流
  196. for _, to := range ctx.Ft.Toes {
  197. toNode, err := buildToNode(ctx, to)
  198. if err != nil {
  199. return err
  200. }
  201. ctx.ToNodes[to] = toNode
  202. str := findOutputStream(ctx, to.GetStreamIndex())
  203. if str == nil {
  204. return fmt.Errorf("no output stream found for data index %d", to.GetStreamIndex())
  205. }
  206. toNode.SetInput(str)
  207. }
  208. return nil
  209. }
  210. func buildFromNode(ctx *state.GenerateState, f ioswitch2.From) (ops2.FromNode, error) {
  211. var repRange math2.Range
  212. repRange.Offset = ctx.StreamRange.Offset
  213. if ctx.StreamRange.Length != nil {
  214. repRngLen := *ctx.StreamRange.Length
  215. repRange.Length = &repRngLen
  216. }
  217. var blkRange math2.Range
  218. if ctx.UseEC {
  219. blkRange.Offset = ctx.StreamRange.Offset / int64(ctx.Ft.ECParam.ChunkSize*ctx.Ft.ECParam.K) * int64(ctx.Ft.ECParam.ChunkSize)
  220. if ctx.StreamRange.Length != nil {
  221. blkRngLen := *ctx.StreamRange.Length / int64(ctx.Ft.ECParam.ChunkSize*ctx.Ft.ECParam.K) * int64(ctx.Ft.ECParam.ChunkSize)
  222. blkRange.Length = &blkRngLen
  223. }
  224. }
  225. switch f := f.(type) {
  226. case *ioswitch2.FromShardstore:
  227. t := ctx.DAG.NewShardRead(f, f.Storage.Storage.StorageID, types.NewOpen(f.FileHash))
  228. if f.StreamIndex.IsRaw() {
  229. t.Open.WithNullableLength(repRange.Offset, repRange.Length)
  230. } else if f.StreamIndex.IsEC() {
  231. t.Open.WithNullableLength(blkRange.Offset, blkRange.Length)
  232. } else if f.StreamIndex.IsSegment() {
  233. segStart := ctx.Ft.SegmentParam.CalcSegmentStart(f.StreamIndex.Index)
  234. segLen := ctx.Ft.SegmentParam.Segments[f.StreamIndex.Index]
  235. segEnd := segStart + segLen
  236. // 打开的范围不超过本段的范围
  237. openOff := ctx.StreamRange.Offset - segStart
  238. openOff = math2.Clamp(openOff, 0, segLen)
  239. openLen := segLen
  240. if ctx.StreamRange.Length != nil {
  241. strEnd := ctx.StreamRange.Offset + *ctx.StreamRange.Length
  242. openEnd := math2.Min(strEnd, segEnd)
  243. openLen = openEnd - segStart - openOff
  244. }
  245. t.Open.WithNullableLength(openOff, &openLen)
  246. }
  247. switch addr := f.Hub.Address.(type) {
  248. case *cdssdk.HttpAddressInfo:
  249. t.Env().ToEnvWorker(&ioswitch2.HttpHubWorker{Hub: f.Hub})
  250. t.Env().Pinned = true
  251. case *cdssdk.GRPCAddressInfo:
  252. t.Env().ToEnvWorker(&ioswitch2.AgentWorker{Hub: f.Hub, Address: *addr})
  253. t.Env().Pinned = true
  254. default:
  255. return nil, fmt.Errorf("unsupported node address type %T", addr)
  256. }
  257. return t, nil
  258. case *ioswitch2.FromDriver:
  259. n := ctx.DAG.NewFromDriver(f, f.Handle)
  260. n.Env().ToEnvDriver()
  261. n.Env().Pinned = true
  262. if f.StreamIndex.IsRaw() {
  263. f.Handle.RangeHint.Offset = repRange.Offset
  264. f.Handle.RangeHint.Length = repRange.Length
  265. } else if f.StreamIndex.IsEC() {
  266. f.Handle.RangeHint.Offset = blkRange.Offset
  267. f.Handle.RangeHint.Length = blkRange.Length
  268. } else if f.StreamIndex.IsSegment() {
  269. segStart := ctx.Ft.SegmentParam.CalcSegmentStart(f.StreamIndex.Index)
  270. segLen := ctx.Ft.SegmentParam.Segments[f.StreamIndex.Index]
  271. segEnd := segStart + segLen
  272. // 打开的范围不超过本段的范围
  273. openOff := repRange.Offset - segStart
  274. openOff = math2.Clamp(openOff, 0, segLen)
  275. openLen := segLen
  276. if repRange.Length != nil {
  277. repEnd := repRange.Offset + *repRange.Length
  278. openEnd := math2.Min(repEnd, segEnd)
  279. openLen = openEnd - openOff
  280. }
  281. f.Handle.RangeHint.Offset = openOff
  282. f.Handle.RangeHint.Length = &openLen
  283. }
  284. return n, nil
  285. default:
  286. return nil, fmt.Errorf("unsupported from type %T", f)
  287. }
  288. }
  289. func buildToNode(ctx *state.GenerateState, t ioswitch2.To) (ops2.ToNode, error) {
  290. switch t := t.(type) {
  291. case *ioswitch2.ToShardStore:
  292. n := ctx.DAG.NewShardWrite(t, t.Storage, t.FileHashStoreKey)
  293. if err := setEnvByAddress(n, t.Hub, t.Hub.Address); err != nil {
  294. return nil, err
  295. }
  296. n.Env().Pinned = true
  297. return n, nil
  298. case *ioswitch2.ToDriver:
  299. n := ctx.DAG.NewToDriver(t, t.Handle)
  300. n.Env().ToEnvDriver()
  301. n.Env().Pinned = true
  302. return n, nil
  303. case *ioswitch2.LoadToShared:
  304. n := ctx.DAG.NewSharedLoad(t, t.Storage, t.ObjectPath)
  305. if err := setEnvByAddress(n, t.Hub, t.Hub.Address); err != nil {
  306. return nil, err
  307. }
  308. n.Env().Pinned = true
  309. return n, nil
  310. default:
  311. return nil, fmt.Errorf("unsupported to type %T", t)
  312. }
  313. }
  314. func setEnvByAddress(n dag.Node, hub cdssdk.Hub, addr cdssdk.HubAddressInfo) error {
  315. switch addr := addr.(type) {
  316. case *cdssdk.HttpAddressInfo:
  317. n.Env().ToEnvWorker(&ioswitch2.HttpHubWorker{Hub: hub})
  318. case *cdssdk.GRPCAddressInfo:
  319. n.Env().ToEnvWorker(&ioswitch2.AgentWorker{Hub: hub, Address: *addr})
  320. default:
  321. return fmt.Errorf("unsupported node address type %T", addr)
  322. }
  323. return nil
  324. }
  325. func findOutputStream(ctx *state.GenerateState, streamIndex ioswitch2.StreamIndex) *dag.StreamVar {
  326. var ret *dag.StreamVar
  327. for _, s := range ctx.IndexedStreams {
  328. if s.StreamIndex == streamIndex {
  329. ret = s.Stream
  330. break
  331. }
  332. }
  333. return ret
  334. }
  335. // 根据StreamRange,调整SegmentSplit中分段的个数和每段的大小
  336. func FixSegmentSplit(ctx *state.GenerateState) error {
  337. var err error
  338. dag.WalkOnlyType[*ops2.SegmentSplitNode](ctx.DAG.Graph, func(node *ops2.SegmentSplitNode) bool {
  339. var strEnd *int64
  340. if ctx.StreamRange.Length != nil {
  341. e := ctx.StreamRange.Offset + *ctx.StreamRange.Length
  342. strEnd = &e
  343. }
  344. startSeg, endSeg := ctx.Ft.SegmentParam.CalcSegmentRange(ctx.StreamRange.Offset, strEnd)
  345. // 关闭超出范围的分段
  346. for i := endSeg; i < len(node.Segments); i++ {
  347. node.OutputStreams().Get(i).ClearAllDst()
  348. }
  349. node.OutputStreams().Slots.RemoveRange(endSeg, ctx.Ft.SegmentParam.SegmentCount()-endSeg)
  350. node.Segments = lo2.RemoveRange(node.Segments, endSeg, ctx.Ft.SegmentParam.SegmentCount()-endSeg)
  351. for i := 0; i < startSeg; i++ {
  352. node.OutputStreams().Get(i).ClearAllDst()
  353. }
  354. node.OutputStreams().Slots.RemoveRange(0, startSeg)
  355. node.Segments = lo2.RemoveRange(node.Segments, 0, startSeg)
  356. // StreamRange开始的位置可能在某个分段的中间,此时这个分段的大小等于流开始位置到分段结束位置的距离
  357. startSegStart := ctx.Ft.SegmentParam.CalcSegmentStart(startSeg)
  358. node.Segments[0] -= ctx.StreamRange.Offset - startSegStart
  359. // StreamRange结束的位置可能在某个分段的中间,此时这个分段的大小就等于流结束位置到分段起始位置的距离
  360. if strEnd != nil {
  361. endSegStart := ctx.Ft.SegmentParam.CalcSegmentStart(endSeg - 1)
  362. node.Segments[len(node.Segments)-1] = *strEnd - endSegStart
  363. }
  364. return true
  365. })
  366. return err
  367. }
  368. // 从SegmentJoin中删除未使用的分段
  369. func FixSegmentJoin(ctx *state.GenerateState) error {
  370. var err error
  371. dag.WalkOnlyType[*ops2.SegmentJoinNode](ctx.DAG.Graph, func(node *ops2.SegmentJoinNode) bool {
  372. start := ctx.StreamRange.Offset
  373. var end *int64
  374. if ctx.StreamRange.Length != nil {
  375. e := ctx.StreamRange.Offset + *ctx.StreamRange.Length
  376. end = &e
  377. }
  378. startSeg, endSeg := ctx.Ft.SegmentParam.CalcSegmentRange(start, end)
  379. // 关闭超出范围的分段
  380. for i := endSeg; i < len(node.Segments); i++ {
  381. node.InputStreams().Get(i).NotTo(node)
  382. }
  383. node.InputStreams().Slots.RemoveRange(endSeg, ctx.Ft.SegmentParam.SegmentCount()-endSeg)
  384. node.Segments = lo2.RemoveRange(node.Segments, endSeg, ctx.Ft.SegmentParam.SegmentCount()-endSeg)
  385. for i := 0; i < startSeg; i++ {
  386. node.InputStreams().Get(i).NotTo(node)
  387. }
  388. node.InputStreams().Slots.RemoveRange(0, startSeg)
  389. node.Segments = lo2.RemoveRange(node.Segments, 0, startSeg)
  390. // StreamRange开始的位置可能在某个分段的中间,此时这个分段的大小等于流开始位置到分段结束位置的距离
  391. startSegStart := ctx.Ft.SegmentParam.CalcSegmentStart(startSeg)
  392. node.Segments[0] -= ctx.StreamRange.Offset - startSegStart
  393. // 检查一下必须的分段是否都被加入到Join中
  394. for i := 0; i < node.InputStreams().Len(); i++ {
  395. if node.InputStreams().Get(i) == nil {
  396. err = fmt.Errorf("segment %v missed to join an raw stream", i+startSeg)
  397. return false
  398. }
  399. }
  400. return true
  401. })
  402. return err
  403. }

本项目旨在将云际存储公共基础设施化,使个人及企业可低门槛使用高效的云际存储服务(安装开箱即用云际存储客户端即可,无需关注其他组件的部署),同时支持用户灵活便捷定制云际存储的功能细节。