1
  2
  3
  4
  5
  6
  7
  8
  9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
use super::super::{RadixKey, Radixable};
use super::american_flag_sort::serial_radixsort_rec;
use super::comparative_sort::insertion_sort;
use super::utils::{get_histogram, prefix_sums, Params};

/// Number of elements processed per iteration of the manually unrolled
/// swapping loop in `ska_swap`.
const UNROLL_SIZE: usize = 4;

/// Moves every element of `arr` into the bucket selected by its radix digit,
/// swapping in place.
///
/// The digit of an element is `extract(mask, shift)` and is used directly as
/// an index into `heads`. `heads[b]` is the next free slot of bucket `b`; it
/// is advanced each time an element is swapped into that bucket. `tails[b]`
/// is the fixed one-past-the-end index of bucket `b`.
///
/// Buckets are scanned from the smallest to the largest remaining size. The
/// largest bucket is never scanned itself: it only receives elements from the
/// other buckets, so (given `heads`/`tails` that are consistent with the
/// content of `arr`) it is complete once all the others are.
///
/// # Arguments
///
/// * `arr` - slice to partition in place.
/// * `heads` - first free index of each bucket; updated in place.
/// * `tails` - end index (exclusive) of each bucket.
/// * `mask`, `shift` - forwarded unchanged to `extract` to obtain the digit.
///
/// # Panics
///
/// Panics if `tails` has fewer entries than `heads`, or if an extracted digit
/// is not a valid index into `heads`.
pub fn ska_swap<T: Radixable<K>, K: RadixKey>(
    arr: &mut [T],
    heads: &mut Vec<usize>,
    tails: &[usize],
    mask: <<T as Radixable<K>>::Key as RadixKey>::Key,
    shift: usize,
) {
    // (bucket index, initial size) pairs, ordered by size so that the largest
    // bucket ends up last and can be dropped from the work list.
    let mut pending: Vec<(usize, usize)> = (0..heads.len())
        .map(|bucket| (bucket, tails[bucket] - heads[bucket]))
        .collect();
    pending.sort_unstable_by_key(|&(_, size)| size);
    pending.pop();

    while !pending.is_empty() {
        for &(bucket, _) in &pending {
            // Snapshot of the unplaced region [start, start + span) of this
            // bucket; `heads[bucket]` itself may move while we scan it.
            let start = heads[bucket];
            let span = tails[bucket] - start;
            debug_assert!(tails[bucket] <= arr.len());

            let mut pos = start;
            for _ in 0..span / UNROLL_SIZE {
                // SAFETY: `pos + 3 < start + span == tails[bucket]`, and the
                // caller provides bucket bounds that lie inside `arr`.
                let (b0, b1, b2, b3) = unsafe {
                    (
                        arr.get_unchecked(pos).extract(mask, shift),
                        arr.get_unchecked(pos + 1).extract(mask, shift),
                        arr.get_unchecked(pos + 2).extract(mask, shift),
                        arr.get_unchecked(pos + 3).extract(mask, shift),
                    )
                };

                // Reserve the destinations one after the other: two elements
                // of the same group may target the same bucket.
                let dest0 = heads[b0];
                heads[b0] += 1;
                let dest1 = heads[b1];
                heads[b1] += 1;
                let dest2 = heads[b2];
                heads[b2] += 1;
                let dest3 = heads[b3];
                heads[b3] += 1;

                arr.swap(pos, dest0);
                arr.swap(pos + 1, dest1);
                arr.swap(pos + 2, dest2);
                arr.swap(pos + 3, dest3);

                pos += UNROLL_SIZE;
            }

            // Leftover elements that do not fill a whole unrolled group.
            for i in pos..start + span {
                // SAFETY: `i < start + span == tails[bucket]`, and the caller
                // provides bucket bounds that lie inside `arr`.
                let b = unsafe { arr.get_unchecked(i).extract(mask, shift) };
                arr.swap(i, heads[b]);
                heads[b] += 1;
            }
        }

        // Drop every bucket that has no unplaced slot left. A drained bucket
        // would do no work on a later visit, so removing it right away does
        // not change the resulting order.
        pending.retain(|&(bucket, _)| heads[bucket] < tails[bucket]);
    }
}

/// Recursive step of the Ska sort.
///
/// Slices of at most 64 elements are handed to `insertion_sort` and slices of
/// at most 1024 elements to `serial_radixsort_rec`. Larger slices are
/// partitioned in place with `ska_swap` using the mask and shift derived from
/// `p`; then, while `p.level < p.max_level - 1`, each bucket holding more
/// than one element is sorted recursively at level `p.level + 1`.
fn ska_sort_rec<T: Radixable<K>, K: RadixKey>(arr: &mut [T], p: Params) {
    if arr.len() <= 64 {
        insertion_sort(arr);
        return;
    }
    if arr.len() <= 1024 {
        serial_radixsort_rec(arr, p);
        return;
    }

    // Any element will do: it is only used to reach the trait methods.
    let dummy = arr[0];
    let (mask, shift) = dummy.get_mask_and_shift_from_left(&p);
    let histogram = get_histogram(arr, &p, mask, shift);
    let (p_sums, mut heads, tails) = prefix_sums(&histogram);

    ska_swap(arr, &mut heads, &tails, mask, shift);

    if p.level < p.max_level - 1 {
        // Peel the buckets off the front of the slice one at a time so each
        // recursive call gets its own disjoint mutable sub-slice.
        let mut rest = arr;
        for i in 0..(p.radix_range) {
            let bucket_len = p_sums[i + 1] - p_sums[i];
            let (bucket, tail) = rest.split_at_mut(bucket_len);
            rest = tail;
            // Buckets with zero or one element are already sorted.
            if histogram[i] > 1 {
                ska_sort_rec(bucket, p.new_level(p.level + 1));
            }
        }
    }
}

/// # Ska sort
///
/// In place, unstable radix sort following the
/// [Ska sort](https://probablydance.com/2016/12/27/i-wrote-a-faster-sorting-algorithm/)
/// algorithm.
///
/// Slices of at most 64 elements are sorted with an insertion sort instead.
/// For longer slices the offset and the number of levels are computed from
/// the data and `radix`; when the number of levels is zero the slice is left
/// untouched.
pub fn ska_sort<T: Radixable<K>, K: RadixKey>(arr: &mut [T], radix: usize) {
    if arr.len() > 64 {
        // Any element will do: it is only used to reach the trait methods.
        let probe = arr[0];
        let (offset, _) = probe.compute_offset(arr, radix);
        let levels = probe.compute_max_level(offset, radix);

        if levels != 0 {
            ska_sort_rec(arr, Params::new(0, radix, offset, levels));
        }
    } else {
        insertion_sort(arr);
    }
}