From 2599eed65d15d41f9a3ac45a5357dd248486b618 Mon Sep 17 00:00:00 2001 From: Oleg Pipikin Date: Fri, 2 Aug 2024 13:38:47 +0200 Subject: [PATCH] Move tokenizers_relative_to_genai impl to cpp from header (#728) --- src/cpp/src/tokenizers_path.cpp | 73 +++++++++++++++++++++++++++++++++ src/cpp/src/tokenizers_path.hpp | 71 ++------------------------------ 2 files changed, 77 insertions(+), 67 deletions(-) create mode 100644 src/cpp/src/tokenizers_path.cpp diff --git a/src/cpp/src/tokenizers_path.cpp b/src/cpp/src/tokenizers_path.cpp new file mode 100644 index 0000000000..e7ad89af7d --- /dev/null +++ b/src/cpp/src/tokenizers_path.cpp @@ -0,0 +1,73 @@ +// Copyright (C) 2024 Intel Corporation +// SPDX-License-Identifier: Apache-2.0 + +#include "tokenizers_path.hpp" + +#include +#ifdef _WIN32 +# include +# define MAX_ABS_PATH _MAX_PATH +# define get_absolute_path(result, path) _fullpath(result, path.c_str(), MAX_ABS_PATH) +#else +# include +# include +# include +# define MAX_ABS_PATH PATH_MAX +# define get_absolute_path(result, path) realpath(path.c_str(), result) +#endif + +namespace { +#ifndef _WIN32 +std::string get_absolute_file_path(const std::string& path) { + std::string absolutePath; + absolutePath.resize(MAX_ABS_PATH); + std::ignore = get_absolute_path(&absolutePath[0], path); + if (!absolutePath.empty()) { + // on Linux if file does not exist or no access, function will return NULL, but + // `absolutePath` will contain resolved path + absolutePath.resize(absolutePath.find('\0')); + return std::string(absolutePath); + } + std::stringstream ss; + ss << "Can't get absolute file path for [" << path << "], err = " << strerror(errno); + throw std::runtime_error(ss.str()); +} +#endif + +std::string get_ov_genai_library_path() { +#ifdef _WIN32 + CHAR genai_library_path[MAX_PATH]; + HMODULE hm = NULL; + if (!GetModuleHandleExA(GET_MODULE_HANDLE_EX_FLAG_FROM_ADDRESS | GET_MODULE_HANDLE_EX_FLAG_UNCHANGED_REFCOUNT, + reinterpret_cast(get_ov_genai_library_path), + &hm)) { + std::stringstream ss; + ss << "GetModuleHandle returned " << GetLastError(); + throw std::runtime_error(ss.str()); + } + GetModuleFileNameA(hm, (LPSTR)genai_library_path, sizeof(genai_library_path)); + return std::string(genai_library_path); +#elif defined(__APPLE__) || defined(__linux__) || defined(__EMSCRIPTEN__) + Dl_info info; + dladdr(reinterpret_cast(get_ov_genai_library_path), &info); + return get_absolute_file_path(info.dli_fname).c_str(); +#else +# error "Unsupported OS" +#endif // _WIN32 +} + +std::filesystem::path with_openvino_tokenizers(const std::filesystem::path& path) { +#ifdef _WIN32 + constexpr char tokenizers[] = "openvino_tokenizers.dll"; +#elif __linux__ + constexpr char tokenizers[] = "libopenvino_tokenizers.so"; +#elif __APPLE__ + constexpr char tokenizers[] = "libopenvino_tokenizers.dylib"; +#endif + return path.parent_path() / tokenizers; +} +} + +std::filesystem::path tokenizers_relative_to_genai() { + return with_openvino_tokenizers(get_ov_genai_library_path()); +} diff --git a/src/cpp/src/tokenizers_path.hpp b/src/cpp/src/tokenizers_path.hpp index 4899daccc4..5557b099f1 100644 --- a/src/cpp/src/tokenizers_path.hpp +++ b/src/cpp/src/tokenizers_path.hpp @@ -4,71 +4,8 @@ #pragma once #include -#include -#ifdef _WIN32 -# include -# define MAX_ABS_PATH _MAX_PATH -# define get_absolute_path(result, path) _fullpath(result, path.c_str(), MAX_ABS_PATH) -#else -# include -# include -# define MAX_ABS_PATH PATH_MAX -# define get_absolute_path(result, path) realpath(path.c_str(), result) -namespace { -std::string get_absolute_file_path(const std::string& path) { - std::string absolutePath; - absolutePath.resize(MAX_ABS_PATH); - std::ignore = get_absolute_path(&absolutePath[0], path); - if (!absolutePath.empty()) { - // on Linux if file does not exist or no access, function will return NULL, but - // `absolutePath` will contain resolved path - absolutePath.resize(absolutePath.find('\0')); - return std::string(absolutePath); - } - std::stringstream ss; - ss << "Can't get absolute file path for [" << path << "], err = " << strerror(errno); - throw std::runtime_error(ss.str()); -} -} -#endif - -// These utilites are used in openvino_genai library and python -// bindings. Put in anonymous namespace to avoid exposing the utilites -// but compile them twice. -namespace { -std::string get_ov_genai_library_path() { -#ifdef _WIN32 - CHAR genai_library_path[MAX_PATH]; - HMODULE hm = NULL; - if (!GetModuleHandleExA(GET_MODULE_HANDLE_EX_FLAG_FROM_ADDRESS | GET_MODULE_HANDLE_EX_FLAG_UNCHANGED_REFCOUNT, - reinterpret_cast(get_ov_genai_library_path), - &hm)) { - std::stringstream ss; - ss << "GetModuleHandle returned " << GetLastError(); - throw std::runtime_error(ss.str()); - } - GetModuleFileNameA(hm, (LPSTR)genai_library_path, sizeof(genai_library_path)); - return std::string(genai_library_path); -#elif defined(__APPLE__) || defined(__linux__) || defined(__EMSCRIPTEN__) - Dl_info info; - dladdr(reinterpret_cast(get_ov_genai_library_path), &info); - return get_absolute_file_path(info.dli_fname).c_str(); -#else -# error "Unsupported OS" -#endif // _WIN32 -} - -std::filesystem::path with_openvino_tokenizers(const std::filesystem::path& path) { -#ifdef _WIN32 - constexpr char tokenizers[] = "openvino_tokenizers.dll"; -#elif __linux__ - constexpr char tokenizers[] = "libopenvino_tokenizers.so"; -#elif __APPLE__ - constexpr char tokenizers[] = "libopenvino_tokenizers.dylib"; -#endif - return path.parent_path() / tokenizers; -} +#include "openvino/genai/visibility.hpp" // Returns an absolute path. The path is this library's directory // concatenated with openvino_tokenizers OS specific @@ -77,10 +14,10 @@ std::filesystem::path with_openvino_tokenizers(const std::filesystem::path& path // tokenizers_relative_to_genai() and ScopedVar allow passing a path to // openvino_tokenizers through env var removing one argument from // Tokenizer's constructor. -std::filesystem::path tokenizers_relative_to_genai() { - return with_openvino_tokenizers(get_ov_genai_library_path()); -} +OPENVINO_GENAI_EXPORTS +std::filesystem::path tokenizers_relative_to_genai(); +namespace { // Sets ENVIRONMENT_VARIABLE_NAME to environment_variable_value // and unsets in destructor. Does nothing if ENVIRONMENT_VARIABLE_NAME // was already defined.