diff --git a/docs/docs/cpp.md b/docs/docs/cpp.md index d92d9137d..2adc06848 100644 --- a/docs/docs/cpp.md +++ b/docs/docs/cpp.md @@ -418,6 +418,23 @@ Status HashPartition(std::shared_ptr &table, */ Status Sort(std::shared_ptr &table, int sort_column, std::shared_ptr &output); +/** + * Performs a distributed sort of the table according to the given column + * @param sort_column the column to sort by + * @return new table sorted according to the sort column + */ +struct SortOptions { + bool ascending; + uint32_t num_bins; + uint64_t num_samples; + + static SortOptions Defaults(); +}; +Status DistributedSort(std::shared_ptr &table, + int sort_column, + std::shared_ptr
&output, + SortOptions sort_options = SortOptions::Defaults()); + /** * Filters out rows based on the selector function * @param table diff --git a/docs/docs/pub.md b/docs/docs/pub.md index 7ab628743..25e641f0b 100644 --- a/docs/docs/pub.md +++ b/docs/docs/pub.md @@ -24,3 +24,13 @@ year={2020} year={2020} } ``` + +- A Fast, Scalable, Universal Approach For Distributed Data Reductions +``` +@article{perera2020fast, + title={A Fast, Scalable, Universal Approach For Distributed Data Reductions}, + author={Perera, Niranda and Abeykoon, Vibhatha and Widanage, Chathura and Kamburugamuve, Supun and Kanewala, Thejaka Amila and Wickramasinghe, Pulasthi and Uyar, Ahmet and Maithree, Hasara and Lenadora, Damitha and Fox, Geoffrey}, + journal={arXiv preprint arXiv:2010.14596}, + year={2020} +} +``` diff --git a/docs/docs/release/cylon_release_0.3.0.md b/docs/docs/release/cylon_release_0.3.0.md new file mode 100644 index 000000000..700939d4a --- /dev/null +++ b/docs/docs/release/cylon_release_0.3.0.md @@ -0,0 +1,47 @@ +--- +id: 0.3.0 +title: Cylon Release 0.3.0 +sidebar_label: Cylon Release 0.3.0 +--- + +Cylon 0.3.0 adds the following features. Please note that this release may not be backward + compatible with previous releases. + +## Major Features + +### C++ + +- Adding order-by and distributed table sort operations +- Multiple partitioning schemes (modulo, hash and range) +- C++ API refactoring +- Performance improvements in the existing C++ API + +### Python (PyCylon) + +- Exposing table operators similar to Pandas (28 new operators). + - Comparison operators + - Logical operators + - Math operators + - Null/NA value filtering and filling + - Filtering and updating (including in-place ops) + - Schema refactoring + - Experimental indexing abstraction +- Python bindings for distributed data sorting +- Adding new examples for updated operations. 
(https://github.com/cylondata/cylon/tree/master/python/examples) + + +### Java (JCylon) + +- Performance improvements + +You can download the source code from [GitHub](https://github.com/cylondata/cylon/releases) + +## Examples + +- [C++ examples](https://github.com/cylondata/cylon/tree/0.3.0/cpp/src/examples) +- [Python examples](https://github.com/cylondata/cylon/tree/0.3.0/python/examples) +- [Java examples](https://github.com/cylondata/cylon/tree/0.3.0/java/src/main/java/org/cylondata/cylon/examples) + +## License + +Licensed under the Apache License, Version 2.0: http://www.apache.org/licenses/LICENSE-2.0 \ No newline at end of file