setutil.go 8.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550
  1. package roaring
  2. func equal(a, b []uint16) bool {
  3. if len(a) != len(b) {
  4. return false
  5. }
  6. for i := range a {
  7. if a[i] != b[i] {
  8. return false
  9. }
  10. }
  11. return true
  12. }
  13. func difference(set1 []uint16, set2 []uint16, buffer []uint16) int {
  14. if 0 == len(set2) {
  15. buffer = buffer[:len(set1)]
  16. for k := 0; k < len(set1); k++ {
  17. buffer[k] = set1[k]
  18. }
  19. return len(set1)
  20. }
  21. if 0 == len(set1) {
  22. return 0
  23. }
  24. pos := 0
  25. k1 := 0
  26. k2 := 0
  27. buffer = buffer[:cap(buffer)]
  28. s1 := set1[k1]
  29. s2 := set2[k2]
  30. for {
  31. if s1 < s2 {
  32. buffer[pos] = s1
  33. pos++
  34. k1++
  35. if k1 >= len(set1) {
  36. break
  37. }
  38. s1 = set1[k1]
  39. } else if s1 == s2 {
  40. k1++
  41. k2++
  42. if k1 >= len(set1) {
  43. break
  44. }
  45. s1 = set1[k1]
  46. if k2 >= len(set2) {
  47. for ; k1 < len(set1); k1++ {
  48. buffer[pos] = set1[k1]
  49. pos++
  50. }
  51. break
  52. }
  53. s2 = set2[k2]
  54. } else { // if (val1>val2)
  55. k2++
  56. if k2 >= len(set2) {
  57. for ; k1 < len(set1); k1++ {
  58. buffer[pos] = set1[k1]
  59. pos++
  60. }
  61. break
  62. }
  63. s2 = set2[k2]
  64. }
  65. }
  66. return pos
  67. }
  68. func exclusiveUnion2by2(set1 []uint16, set2 []uint16, buffer []uint16) int {
  69. if 0 == len(set2) {
  70. buffer = buffer[:len(set1)]
  71. copy(buffer, set1[:])
  72. return len(set1)
  73. }
  74. if 0 == len(set1) {
  75. buffer = buffer[:len(set2)]
  76. copy(buffer, set2[:])
  77. return len(set2)
  78. }
  79. pos := 0
  80. k1 := 0
  81. k2 := 0
  82. s1 := set1[k1]
  83. s2 := set2[k2]
  84. buffer = buffer[:cap(buffer)]
  85. for {
  86. if s1 < s2 {
  87. buffer[pos] = s1
  88. pos++
  89. k1++
  90. if k1 >= len(set1) {
  91. for ; k2 < len(set2); k2++ {
  92. buffer[pos] = set2[k2]
  93. pos++
  94. }
  95. break
  96. }
  97. s1 = set1[k1]
  98. } else if s1 == s2 {
  99. k1++
  100. k2++
  101. if k1 >= len(set1) {
  102. for ; k2 < len(set2); k2++ {
  103. buffer[pos] = set2[k2]
  104. pos++
  105. }
  106. break
  107. }
  108. if k2 >= len(set2) {
  109. for ; k1 < len(set1); k1++ {
  110. buffer[pos] = set1[k1]
  111. pos++
  112. }
  113. break
  114. }
  115. s1 = set1[k1]
  116. s2 = set2[k2]
  117. } else { // if (val1>val2)
  118. buffer[pos] = s2
  119. pos++
  120. k2++
  121. if k2 >= len(set2) {
  122. for ; k1 < len(set1); k1++ {
  123. buffer[pos] = set1[k1]
  124. pos++
  125. }
  126. break
  127. }
  128. s2 = set2[k2]
  129. }
  130. }
  131. return pos
  132. }
  133. func union2by2Cardinality(set1 []uint16, set2 []uint16) int {
  134. pos := 0
  135. k1 := 0
  136. k2 := 0
  137. if 0 == len(set2) {
  138. return len(set1)
  139. }
  140. if 0 == len(set1) {
  141. return len(set2)
  142. }
  143. s1 := set1[k1]
  144. s2 := set2[k2]
  145. for {
  146. if s1 < s2 {
  147. pos++
  148. k1++
  149. if k1 >= len(set1) {
  150. pos += len(set2) - k2
  151. break
  152. }
  153. s1 = set1[k1]
  154. } else if s1 == s2 {
  155. pos++
  156. k1++
  157. k2++
  158. if k1 >= len(set1) {
  159. pos += len(set2) - k2
  160. break
  161. }
  162. if k2 >= len(set2) {
  163. pos += len(set1) - k1
  164. break
  165. }
  166. s1 = set1[k1]
  167. s2 = set2[k2]
  168. } else { // if (set1[k1]>set2[k2])
  169. pos++
  170. k2++
  171. if k2 >= len(set2) {
  172. pos += len(set1) - k1
  173. break
  174. }
  175. s2 = set2[k2]
  176. }
  177. }
  178. return pos
  179. }
  180. func intersection2by2(
  181. set1 []uint16,
  182. set2 []uint16,
  183. buffer []uint16) int {
  184. if len(set1)*64 < len(set2) {
  185. return onesidedgallopingintersect2by2(set1, set2, buffer)
  186. } else if len(set2)*64 < len(set1) {
  187. return onesidedgallopingintersect2by2(set2, set1, buffer)
  188. } else {
  189. return localintersect2by2(set1, set2, buffer)
  190. }
  191. }
  192. func intersection2by2Cardinality(
  193. set1 []uint16,
  194. set2 []uint16) int {
  195. if len(set1)*64 < len(set2) {
  196. return onesidedgallopingintersect2by2Cardinality(set1, set2)
  197. } else if len(set2)*64 < len(set1) {
  198. return onesidedgallopingintersect2by2Cardinality(set2, set1)
  199. } else {
  200. return localintersect2by2Cardinality(set1, set2)
  201. }
  202. }
  203. func intersects2by2(
  204. set1 []uint16,
  205. set2 []uint16) bool {
  206. // could be optimized if one set is much larger than the other one
  207. if (0 == len(set1)) || (0 == len(set2)) {
  208. return false
  209. }
  210. k1 := 0
  211. k2 := 0
  212. s1 := set1[k1]
  213. s2 := set2[k2]
  214. mainwhile:
  215. for {
  216. if s2 < s1 {
  217. for {
  218. k2++
  219. if k2 == len(set2) {
  220. break mainwhile
  221. }
  222. s2 = set2[k2]
  223. if s2 >= s1 {
  224. break
  225. }
  226. }
  227. }
  228. if s1 < s2 {
  229. for {
  230. k1++
  231. if k1 == len(set1) {
  232. break mainwhile
  233. }
  234. s1 = set1[k1]
  235. if s1 >= s2 {
  236. break
  237. }
  238. }
  239. } else {
  240. // (set2[k2] == set1[k1])
  241. return true
  242. }
  243. }
  244. return false
  245. }
  246. func localintersect2by2(
  247. set1 []uint16,
  248. set2 []uint16,
  249. buffer []uint16) int {
  250. if (0 == len(set1)) || (0 == len(set2)) {
  251. return 0
  252. }
  253. k1 := 0
  254. k2 := 0
  255. pos := 0
  256. buffer = buffer[:cap(buffer)]
  257. s1 := set1[k1]
  258. s2 := set2[k2]
  259. mainwhile:
  260. for {
  261. if s2 < s1 {
  262. for {
  263. k2++
  264. if k2 == len(set2) {
  265. break mainwhile
  266. }
  267. s2 = set2[k2]
  268. if s2 >= s1 {
  269. break
  270. }
  271. }
  272. }
  273. if s1 < s2 {
  274. for {
  275. k1++
  276. if k1 == len(set1) {
  277. break mainwhile
  278. }
  279. s1 = set1[k1]
  280. if s1 >= s2 {
  281. break
  282. }
  283. }
  284. } else {
  285. // (set2[k2] == set1[k1])
  286. buffer[pos] = s1
  287. pos++
  288. k1++
  289. if k1 == len(set1) {
  290. break
  291. }
  292. s1 = set1[k1]
  293. k2++
  294. if k2 == len(set2) {
  295. break
  296. }
  297. s2 = set2[k2]
  298. }
  299. }
  300. return pos
  301. }
  302. func localintersect2by2Cardinality(
  303. set1 []uint16,
  304. set2 []uint16) int {
  305. if (0 == len(set1)) || (0 == len(set2)) {
  306. return 0
  307. }
  308. k1 := 0
  309. k2 := 0
  310. pos := 0
  311. s1 := set1[k1]
  312. s2 := set2[k2]
  313. mainwhile:
  314. for {
  315. if s2 < s1 {
  316. for {
  317. k2++
  318. if k2 == len(set2) {
  319. break mainwhile
  320. }
  321. s2 = set2[k2]
  322. if s2 >= s1 {
  323. break
  324. }
  325. }
  326. }
  327. if s1 < s2 {
  328. for {
  329. k1++
  330. if k1 == len(set1) {
  331. break mainwhile
  332. }
  333. s1 = set1[k1]
  334. if s1 >= s2 {
  335. break
  336. }
  337. }
  338. } else {
  339. // (set2[k2] == set1[k1])
  340. pos++
  341. k1++
  342. if k1 == len(set1) {
  343. break
  344. }
  345. s1 = set1[k1]
  346. k2++
  347. if k2 == len(set2) {
  348. break
  349. }
  350. s2 = set2[k2]
  351. }
  352. }
  353. return pos
  354. }
  355. func advanceUntil(
  356. array []uint16,
  357. pos int,
  358. length int,
  359. min uint16) int {
  360. lower := pos + 1
  361. if lower >= length || array[lower] >= min {
  362. return lower
  363. }
  364. spansize := 1
  365. for lower+spansize < length && array[lower+spansize] < min {
  366. spansize *= 2
  367. }
  368. var upper int
  369. if lower+spansize < length {
  370. upper = lower + spansize
  371. } else {
  372. upper = length - 1
  373. }
  374. if array[upper] == min {
  375. return upper
  376. }
  377. if array[upper] < min {
  378. // means
  379. // array
  380. // has no
  381. // item
  382. // >= min
  383. // pos = array.length;
  384. return length
  385. }
  386. // we know that the next-smallest span was too small
  387. lower += (spansize >> 1)
  388. mid := 0
  389. for lower+1 != upper {
  390. mid = (lower + upper) >> 1
  391. if array[mid] == min {
  392. return mid
  393. } else if array[mid] < min {
  394. lower = mid
  395. } else {
  396. upper = mid
  397. }
  398. }
  399. return upper
  400. }
  401. func onesidedgallopingintersect2by2(
  402. smallset []uint16,
  403. largeset []uint16,
  404. buffer []uint16) int {
  405. if 0 == len(smallset) {
  406. return 0
  407. }
  408. buffer = buffer[:cap(buffer)]
  409. k1 := 0
  410. k2 := 0
  411. pos := 0
  412. s1 := largeset[k1]
  413. s2 := smallset[k2]
  414. mainwhile:
  415. for {
  416. if s1 < s2 {
  417. k1 = advanceUntil(largeset, k1, len(largeset), s2)
  418. if k1 == len(largeset) {
  419. break mainwhile
  420. }
  421. s1 = largeset[k1]
  422. }
  423. if s2 < s1 {
  424. k2++
  425. if k2 == len(smallset) {
  426. break mainwhile
  427. }
  428. s2 = smallset[k2]
  429. } else {
  430. buffer[pos] = s2
  431. pos++
  432. k2++
  433. if k2 == len(smallset) {
  434. break
  435. }
  436. s2 = smallset[k2]
  437. k1 = advanceUntil(largeset, k1, len(largeset), s2)
  438. if k1 == len(largeset) {
  439. break mainwhile
  440. }
  441. s1 = largeset[k1]
  442. }
  443. }
  444. return pos
  445. }
  446. func onesidedgallopingintersect2by2Cardinality(
  447. smallset []uint16,
  448. largeset []uint16) int {
  449. if 0 == len(smallset) {
  450. return 0
  451. }
  452. k1 := 0
  453. k2 := 0
  454. pos := 0
  455. s1 := largeset[k1]
  456. s2 := smallset[k2]
  457. mainwhile:
  458. for {
  459. if s1 < s2 {
  460. k1 = advanceUntil(largeset, k1, len(largeset), s2)
  461. if k1 == len(largeset) {
  462. break mainwhile
  463. }
  464. s1 = largeset[k1]
  465. }
  466. if s2 < s1 {
  467. k2++
  468. if k2 == len(smallset) {
  469. break mainwhile
  470. }
  471. s2 = smallset[k2]
  472. } else {
  473. pos++
  474. k2++
  475. if k2 == len(smallset) {
  476. break
  477. }
  478. s2 = smallset[k2]
  479. k1 = advanceUntil(largeset, k1, len(largeset), s2)
  480. if k1 == len(largeset) {
  481. break mainwhile
  482. }
  483. s1 = largeset[k1]
  484. }
  485. }
  486. return pos
  487. }
  488. func binarySearch(array []uint16, ikey uint16) int {
  489. low := 0
  490. high := len(array) - 1
  491. for low+16 <= high {
  492. middleIndex := int(uint32(low+high) >> 1)
  493. middleValue := array[middleIndex]
  494. if middleValue < ikey {
  495. low = middleIndex + 1
  496. } else if middleValue > ikey {
  497. high = middleIndex - 1
  498. } else {
  499. return middleIndex
  500. }
  501. }
  502. for ; low <= high; low++ {
  503. val := array[low]
  504. if val >= ikey {
  505. if val == ikey {
  506. return low
  507. }
  508. break
  509. }
  510. }
  511. return -(low + 1)
  512. }