Skip to content

Commit

Permalink
Remove unused parsing utilities (#15955)
Browse files Browse the repository at this point in the history
Some parsing utilities have been unused since legacy JSON removal.
This PR removes these functions.

Authors:
  - Vukasin Milovanovic (https://github.com/vuule)

Approvers:
  - Bradley Dice (https://github.com/bdice)
  - Nghia Truong (https://github.com/ttnghia)
  - Vyas Ramasubramani (https://github.com/vyasr)

URL: #15955
  • Loading branch information
vuule authored Jun 7, 2024
1 parent 139ed6c commit 8e40fe7
Show file tree
Hide file tree
Showing 3 changed files with 0 additions and 298 deletions.
1 change: 0 additions & 1 deletion cpp/CMakeLists.txt
Original file line number Diff line number Diff line change
Expand Up @@ -439,7 +439,6 @@ add_library(
src/io/utilities/data_sink.cpp
src/io/utilities/datasource.cpp
src/io/utilities/file_io_utilities.cpp
src/io/utilities/parsing_utils.cu
src/io/utilities/row_selection.cpp
src/io/utilities/type_inference.cu
src/io/utilities/trie.cu
Expand Down
221 changes: 0 additions & 221 deletions cpp/src/io/utilities/parsing_utils.cu

This file was deleted.

76 changes: 0 additions & 76 deletions cpp/src/io/utilities/parsing_utils.cuh
Original file line number Diff line number Diff line change
Expand Up @@ -414,82 +414,6 @@ __device__ __inline__ cudf::size_type* infer_integral_field_counter(char const*

} // namespace gpu

/**
* @brief Searches the input character array for each of the characters in a set.
* Sums up the number of occurrences. If the 'positions' parameter is not void*,
* positions of all occurrences are stored in the output device array.
*
* @tparam T Type pointed to by `positions`; per the note above, `void` means
* that occurrences are only counted and no positions are written
*
* @param[in] data Input character array in device memory
* @param[in] keys Vector containing the keys to count in the buffer
* @param[in] result_offset Offset to add to the output positions
* @param[out] positions Array containing the output positions
* @param[in] stream CUDA stream used for device memory operations and kernel launches
*
* @return cudf::size_type total number of occurrences
*/
template <class T>
cudf::size_type find_all_from_set(device_span<char const> data,
std::vector<char> const& keys,
uint64_t result_offset,
T* positions,
rmm::cuda_stream_view stream);

/**
* @brief Searches the input character array for each of the characters in a set.
* Sums up the number of occurrences. If the 'positions' parameter is not void*,
* positions of all occurrences are stored in the output device array.
*
* Does not load the entire file into the GPU memory at any time, so it can
* be used to parse large files. Output array needs to be preallocated.
*
* @tparam T Type pointed to by `positions`; per the note above, `void` means
* that occurrences are only counted and no positions are written
*
* @param[in] data Input character array, passed as a host span (pointer and
* number of bytes)
* @param[in] keys Vector containing the keys to count in the buffer
* @param[in] result_offset Offset to add to the output positions
* @param[out] positions Array containing the output positions
* @param[in] stream CUDA stream used for device memory operations and kernel launches
*
* @return cudf::size_type total number of occurrences
*/
template <class T>
cudf::size_type find_all_from_set(host_span<char const> data,
std::vector<char> const& keys,
uint64_t result_offset,
T* positions,
rmm::cuda_stream_view stream);

/**
* @brief Searches the input character array for each of the characters in a set
* and sums up the number of occurrences.
*
* @param data Input data buffer in device memory
* @param keys Vector containing the keys to count in the buffer
* @param stream CUDA stream used for device memory operations and kernel launches
*
* @return cudf::size_type total number of occurrences
*/
cudf::size_type count_all_from_set(device_span<char const> data,
std::vector<char> const& keys,
rmm::cuda_stream_view stream);

/**
* @brief Searches the input character array for each of the characters in a set
* and sums up the number of occurrences.
*
* Does not load the entire buffer into the GPU memory at any time, so it can
* be used with buffers of any size.
*
* @param data Input data in host memory, passed as a host span (pointer and
* size in bytes)
* @param keys Vector containing the keys to count in the buffer
* @param stream CUDA stream used for device memory operations and kernel launches
*
* @return cudf::size_type total number of occurrences
*/
cudf::size_type count_all_from_set(host_span<char const> data,
std::vector<char> const& keys,
rmm::cuda_stream_view stream);

/**
* @brief Checks whether the given character is a whitespace character.
*
Expand Down

0 comments on commit 8e40fe7

Please sign in to comment.