set.go 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505
  1. /*
  2. Copyright 2018 The Kubernetes Authors.
  3. Licensed under the Apache License, Version 2.0 (the "License");
  4. you may not use this file except in compliance with the License.
  5. You may obtain a copy of the License at
  6. http://www.apache.org/licenses/LICENSE-2.0
  7. Unless required by applicable law or agreed to in writing, software
  8. distributed under the License is distributed on an "AS IS" BASIS,
  9. WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. See the License for the specific language governing permissions and
  11. limitations under the License.
  12. */
  13. package fieldpath
  14. import (
  15. "sort"
  16. "strings"
  17. "sigs.k8s.io/structured-merge-diff/v4/schema"
  18. )
  19. // Set identifies a set of fields.
  20. type Set struct {
  21. // Members lists fields that are part of the set.
  22. // TODO: will be serialized as a list of path elements.
  23. Members PathElementSet
  24. // Children lists child fields which themselves have children that are
  25. // members of the set. Appearance in this list does not imply membership.
  26. // Note: this is a tree, not an arbitrary graph.
  27. Children SetNodeMap
  28. }
  29. // NewSet makes a set from a list of paths.
  30. func NewSet(paths ...Path) *Set {
  31. s := &Set{}
  32. for _, p := range paths {
  33. s.Insert(p)
  34. }
  35. return s
  36. }
  37. // Insert adds the field identified by `p` to the set. Important: parent fields
  38. // are NOT added to the set; if that is desired, they must be added separately.
  39. func (s *Set) Insert(p Path) {
  40. if len(p) == 0 {
  41. // Zero-length path identifies the entire object; we don't
  42. // track top-level ownership.
  43. return
  44. }
  45. for {
  46. if len(p) == 1 {
  47. s.Members.Insert(p[0])
  48. return
  49. }
  50. s = s.Children.Descend(p[0])
  51. p = p[1:]
  52. }
  53. }
  54. // Union returns a Set containing elements which appear in either s or s2.
  55. func (s *Set) Union(s2 *Set) *Set {
  56. return &Set{
  57. Members: *s.Members.Union(&s2.Members),
  58. Children: *s.Children.Union(&s2.Children),
  59. }
  60. }
  61. // Intersection returns a Set containing leaf elements which appear in both s
  62. // and s2. Intersection can be constructed from Union and Difference operations
  63. // (example in the tests) but it's much faster to do it in one pass.
  64. func (s *Set) Intersection(s2 *Set) *Set {
  65. return &Set{
  66. Members: *s.Members.Intersection(&s2.Members),
  67. Children: *s.Children.Intersection(&s2.Children),
  68. }
  69. }
  70. // Difference returns a Set containing elements which:
  71. // * appear in s
  72. // * do not appear in s2
  73. //
  74. // In other words, for leaf fields, this acts like a regular set difference
  75. // operation. When non leaf fields are compared with leaf fields ("parents"
  76. // which contain "children"), the effect is:
  77. // * parent - child = parent
  78. // * child - parent = {empty set}
  79. func (s *Set) Difference(s2 *Set) *Set {
  80. return &Set{
  81. Members: *s.Members.Difference(&s2.Members),
  82. Children: *s.Children.Difference(s2),
  83. }
  84. }
  85. // RecursiveDifference returns a Set containing elements which:
  86. // * appear in s
  87. // * do not appear in s2
  88. //
  89. // Compared to a regular difference,
  90. // this removes every field **and its children** from s that is contained in s2.
  91. //
  92. // For example, with s containing `a.b.c` and s2 containing `a.b`,
  93. // a RecursiveDifference will result in `a`, as the entire node `a.b` gets removed.
  94. func (s *Set) RecursiveDifference(s2 *Set) *Set {
  95. return &Set{
  96. Members: *s.Members.Difference(&s2.Members),
  97. Children: *s.Children.RecursiveDifference(s2),
  98. }
  99. }
  100. // EnsureNamedFieldsAreMembers returns a Set that contains all the
  101. // fields in s, as well as all the named fields that are typically not
  102. // included. For example, a set made of "a.b.c" will end-up also owning
  103. // "a" if it's a named fields but not "a.b" if it's a map.
  104. func (s *Set) EnsureNamedFieldsAreMembers(sc *schema.Schema, tr schema.TypeRef) *Set {
  105. members := PathElementSet{
  106. members: make(sortedPathElements, 0, s.Members.Size()+len(s.Children.members)),
  107. }
  108. atom, _ := sc.Resolve(tr)
  109. members.members = append(members.members, s.Members.members...)
  110. for _, node := range s.Children.members {
  111. // Only insert named fields.
  112. if node.pathElement.FieldName != nil && atom.Map != nil {
  113. if _, has := atom.Map.FindField(*node.pathElement.FieldName); has {
  114. members.Insert(node.pathElement)
  115. }
  116. }
  117. }
  118. return &Set{
  119. Members: members,
  120. Children: *s.Children.EnsureNamedFieldsAreMembers(sc, tr),
  121. }
  122. }
  123. // Size returns the number of members of the set.
  124. func (s *Set) Size() int {
  125. return s.Members.Size() + s.Children.Size()
  126. }
  127. // Empty returns true if there are no members of the set. It is a separate
  128. // function from Size since it's common to check whether size > 0, and
  129. // potentially much faster to return as soon as a single element is found.
  130. func (s *Set) Empty() bool {
  131. if s.Members.Size() > 0 {
  132. return false
  133. }
  134. return s.Children.Empty()
  135. }
  136. // Has returns true if the field referenced by `p` is a member of the set.
  137. func (s *Set) Has(p Path) bool {
  138. if len(p) == 0 {
  139. // No one owns "the entire object"
  140. return false
  141. }
  142. for {
  143. if len(p) == 1 {
  144. return s.Members.Has(p[0])
  145. }
  146. var ok bool
  147. s, ok = s.Children.Get(p[0])
  148. if !ok {
  149. return false
  150. }
  151. p = p[1:]
  152. }
  153. }
  154. // Equals returns true if s and s2 have exactly the same members.
  155. func (s *Set) Equals(s2 *Set) bool {
  156. return s.Members.Equals(&s2.Members) && s.Children.Equals(&s2.Children)
  157. }
  158. // String returns the set one element per line.
  159. func (s *Set) String() string {
  160. elements := []string{}
  161. s.Iterate(func(p Path) {
  162. elements = append(elements, p.String())
  163. })
  164. return strings.Join(elements, "\n")
  165. }
  166. // Iterate calls f once for each field that is a member of the set (preorder
  167. // DFS). The path passed to f will be reused so make a copy if you wish to keep
  168. // it.
  169. func (s *Set) Iterate(f func(Path)) {
  170. s.iteratePrefix(Path{}, f)
  171. }
  172. func (s *Set) iteratePrefix(prefix Path, f func(Path)) {
  173. s.Members.Iterate(func(pe PathElement) { f(append(prefix, pe)) })
  174. s.Children.iteratePrefix(prefix, f)
  175. }
  176. // WithPrefix returns the subset of paths which begin with the given prefix,
  177. // with the prefix not included.
  178. func (s *Set) WithPrefix(pe PathElement) *Set {
  179. subset, ok := s.Children.Get(pe)
  180. if !ok {
  181. return NewSet()
  182. }
  183. return subset
  184. }
  185. // Leaves returns a set containing only the leaf paths
  186. // of a set.
  187. func (s *Set) Leaves() *Set {
  188. leaves := PathElementSet{}
  189. im := 0
  190. ic := 0
  191. // any members that are not also children are leaves
  192. outer:
  193. for im < len(s.Members.members) {
  194. member := s.Members.members[im]
  195. for ic < len(s.Children.members) {
  196. d := member.Compare(s.Children.members[ic].pathElement)
  197. if d == 0 {
  198. ic++
  199. im++
  200. continue outer
  201. } else if d < 0 {
  202. break
  203. } else /* if d > 0 */ {
  204. ic++
  205. }
  206. }
  207. leaves.members = append(leaves.members, member)
  208. im++
  209. }
  210. return &Set{
  211. Members: leaves,
  212. Children: *s.Children.Leaves(),
  213. }
  214. }
  215. // setNode is a pair of PathElement / Set, for the purpose of expressing
  216. // nested set membership.
  217. type setNode struct {
  218. pathElement PathElement
  219. set *Set
  220. }
  221. // SetNodeMap is a map of PathElement to subset.
  222. type SetNodeMap struct {
  223. members sortedSetNode
  224. }
  225. type sortedSetNode []setNode
  226. // Implement the sort interface; this would permit bulk creation, which would
  227. // be faster than doing it one at a time via Insert.
  228. func (s sortedSetNode) Len() int { return len(s) }
  229. func (s sortedSetNode) Less(i, j int) bool { return s[i].pathElement.Less(s[j].pathElement) }
  230. func (s sortedSetNode) Swap(i, j int) { s[i], s[j] = s[j], s[i] }
  231. // Descend adds pe to the set if necessary, returning the associated subset.
  232. func (s *SetNodeMap) Descend(pe PathElement) *Set {
  233. loc := sort.Search(len(s.members), func(i int) bool {
  234. return !s.members[i].pathElement.Less(pe)
  235. })
  236. if loc == len(s.members) {
  237. s.members = append(s.members, setNode{pathElement: pe, set: &Set{}})
  238. return s.members[loc].set
  239. }
  240. if s.members[loc].pathElement.Equals(pe) {
  241. return s.members[loc].set
  242. }
  243. s.members = append(s.members, setNode{})
  244. copy(s.members[loc+1:], s.members[loc:])
  245. s.members[loc] = setNode{pathElement: pe, set: &Set{}}
  246. return s.members[loc].set
  247. }
  248. // Size returns the sum of the number of members of all subsets.
  249. func (s *SetNodeMap) Size() int {
  250. count := 0
  251. for _, v := range s.members {
  252. count += v.set.Size()
  253. }
  254. return count
  255. }
  256. // Empty returns false if there's at least one member in some child set.
  257. func (s *SetNodeMap) Empty() bool {
  258. for _, n := range s.members {
  259. if !n.set.Empty() {
  260. return false
  261. }
  262. }
  263. return true
  264. }
  265. // Get returns (the associated set, true) or (nil, false) if there is none.
  266. func (s *SetNodeMap) Get(pe PathElement) (*Set, bool) {
  267. loc := sort.Search(len(s.members), func(i int) bool {
  268. return !s.members[i].pathElement.Less(pe)
  269. })
  270. if loc == len(s.members) {
  271. return nil, false
  272. }
  273. if s.members[loc].pathElement.Equals(pe) {
  274. return s.members[loc].set, true
  275. }
  276. return nil, false
  277. }
  278. // Equals returns true if s and s2 have the same structure (same nested
  279. // child sets).
  280. func (s *SetNodeMap) Equals(s2 *SetNodeMap) bool {
  281. if len(s.members) != len(s2.members) {
  282. return false
  283. }
  284. for i := range s.members {
  285. if !s.members[i].pathElement.Equals(s2.members[i].pathElement) {
  286. return false
  287. }
  288. if !s.members[i].set.Equals(s2.members[i].set) {
  289. return false
  290. }
  291. }
  292. return true
  293. }
  294. // Union returns a SetNodeMap with members that appear in either s or s2.
  295. func (s *SetNodeMap) Union(s2 *SetNodeMap) *SetNodeMap {
  296. out := &SetNodeMap{}
  297. i, j := 0, 0
  298. for i < len(s.members) && j < len(s2.members) {
  299. if s.members[i].pathElement.Less(s2.members[j].pathElement) {
  300. out.members = append(out.members, s.members[i])
  301. i++
  302. } else {
  303. if !s2.members[j].pathElement.Less(s.members[i].pathElement) {
  304. out.members = append(out.members, setNode{pathElement: s.members[i].pathElement, set: s.members[i].set.Union(s2.members[j].set)})
  305. i++
  306. } else {
  307. out.members = append(out.members, s2.members[j])
  308. }
  309. j++
  310. }
  311. }
  312. if i < len(s.members) {
  313. out.members = append(out.members, s.members[i:]...)
  314. }
  315. if j < len(s2.members) {
  316. out.members = append(out.members, s2.members[j:]...)
  317. }
  318. return out
  319. }
  320. // Intersection returns a SetNodeMap with members that appear in both s and s2.
  321. func (s *SetNodeMap) Intersection(s2 *SetNodeMap) *SetNodeMap {
  322. out := &SetNodeMap{}
  323. i, j := 0, 0
  324. for i < len(s.members) && j < len(s2.members) {
  325. if s.members[i].pathElement.Less(s2.members[j].pathElement) {
  326. i++
  327. } else {
  328. if !s2.members[j].pathElement.Less(s.members[i].pathElement) {
  329. res := s.members[i].set.Intersection(s2.members[j].set)
  330. if !res.Empty() {
  331. out.members = append(out.members, setNode{pathElement: s.members[i].pathElement, set: res})
  332. }
  333. i++
  334. }
  335. j++
  336. }
  337. }
  338. return out
  339. }
  340. // Difference returns a SetNodeMap with members that appear in s but not in s2.
  341. func (s *SetNodeMap) Difference(s2 *Set) *SetNodeMap {
  342. out := &SetNodeMap{}
  343. i, j := 0, 0
  344. for i < len(s.members) && j < len(s2.Children.members) {
  345. if s.members[i].pathElement.Less(s2.Children.members[j].pathElement) {
  346. out.members = append(out.members, setNode{pathElement: s.members[i].pathElement, set: s.members[i].set})
  347. i++
  348. } else {
  349. if !s2.Children.members[j].pathElement.Less(s.members[i].pathElement) {
  350. diff := s.members[i].set.Difference(s2.Children.members[j].set)
  351. // We aren't permitted to add nodes with no elements.
  352. if !diff.Empty() {
  353. out.members = append(out.members, setNode{pathElement: s.members[i].pathElement, set: diff})
  354. }
  355. i++
  356. }
  357. j++
  358. }
  359. }
  360. if i < len(s.members) {
  361. out.members = append(out.members, s.members[i:]...)
  362. }
  363. return out
  364. }
  365. // RecursiveDifference returns a SetNodeMap with members that appear in s but not in s2.
  366. //
  367. // Compared to a regular difference,
  368. // this removes every field **and its children** from s that is contained in s2.
  369. //
  370. // For example, with s containing `a.b.c` and s2 containing `a.b`,
  371. // a RecursiveDifference will result in `a`, as the entire node `a.b` gets removed.
  372. func (s *SetNodeMap) RecursiveDifference(s2 *Set) *SetNodeMap {
  373. out := &SetNodeMap{}
  374. i, j := 0, 0
  375. for i < len(s.members) && j < len(s2.Children.members) {
  376. if s.members[i].pathElement.Less(s2.Children.members[j].pathElement) {
  377. if !s2.Members.Has(s.members[i].pathElement) {
  378. out.members = append(out.members, setNode{pathElement: s.members[i].pathElement, set: s.members[i].set})
  379. }
  380. i++
  381. } else {
  382. if !s2.Children.members[j].pathElement.Less(s.members[i].pathElement) {
  383. if !s2.Members.Has(s.members[i].pathElement) {
  384. diff := s.members[i].set.RecursiveDifference(s2.Children.members[j].set)
  385. if !diff.Empty() {
  386. out.members = append(out.members, setNode{pathElement: s.members[i].pathElement, set: diff})
  387. }
  388. }
  389. i++
  390. }
  391. j++
  392. }
  393. }
  394. if i < len(s.members) {
  395. for _, c := range s.members[i:] {
  396. if !s2.Members.Has(c.pathElement) {
  397. out.members = append(out.members, c)
  398. }
  399. }
  400. }
  401. return out
  402. }
  403. // EnsureNamedFieldsAreMembers returns a set that contains all the named fields along with the leaves.
  404. func (s *SetNodeMap) EnsureNamedFieldsAreMembers(sc *schema.Schema, tr schema.TypeRef) *SetNodeMap {
  405. out := make(sortedSetNode, 0, s.Size())
  406. atom, _ := sc.Resolve(tr)
  407. for _, member := range s.members {
  408. tr := schema.TypeRef{}
  409. if member.pathElement.FieldName != nil && atom.Map != nil {
  410. tr = atom.Map.ElementType
  411. if sf, ok := atom.Map.FindField(*member.pathElement.FieldName); ok {
  412. tr = sf.Type
  413. }
  414. } else if member.pathElement.Key != nil && atom.List != nil {
  415. tr = atom.List.ElementType
  416. }
  417. out = append(out, setNode{
  418. pathElement: member.pathElement,
  419. set: member.set.EnsureNamedFieldsAreMembers(sc, tr),
  420. })
  421. }
  422. return &SetNodeMap{
  423. members: out,
  424. }
  425. }
  426. // Iterate calls f for each PathElement in the set.
  427. func (s *SetNodeMap) Iterate(f func(PathElement)) {
  428. for _, n := range s.members {
  429. f(n.pathElement)
  430. }
  431. }
  432. func (s *SetNodeMap) iteratePrefix(prefix Path, f func(Path)) {
  433. for _, n := range s.members {
  434. pe := n.pathElement
  435. n.set.iteratePrefix(append(prefix, pe), f)
  436. }
  437. }
  438. // Leaves returns a SetNodeMap containing
  439. // only setNodes with leaf PathElements.
  440. func (s *SetNodeMap) Leaves() *SetNodeMap {
  441. out := &SetNodeMap{}
  442. out.members = make(sortedSetNode, len(s.members))
  443. for i, n := range s.members {
  444. out.members[i] = setNode{
  445. pathElement: n.pathElement,
  446. set: n.set.Leaves(),
  447. }
  448. }
  449. return out
  450. }