-
Notifications
You must be signed in to change notification settings - Fork 5.2k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #4860 from kinaryml:c-language-detector-api
PiperOrigin-RevId: 572385111
- Loading branch information
Showing
8 changed files
with
560 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
56 changes: 56 additions & 0 deletions
56
mediapipe/tasks/c/components/containers/language_detection_result_converter.cc
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,56 @@ | ||
/* Copyright 2023 The MediaPipe Authors. | ||
Licensed under the Apache License, Version 2.0 (the "License"); | ||
you may not use this file except in compliance with the License. | ||
You may obtain a copy of the License at | ||
http://www.apache.org/licenses/LICENSE-2.0 | ||
Unless required by applicable law or agreed to in writing, software | ||
distributed under the License is distributed on an "AS IS" BASIS, | ||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
See the License for the specific language governing permissions and | ||
limitations under the License. | ||
==============================================================================*/ | ||
|
||
#include "mediapipe/tasks/c/components/containers/language_detection_result_converter.h" | ||
|
||
#include <cstdint> | ||
#include <cstdlib> | ||
|
||
#include "mediapipe/tasks/c/text/language_detector/language_detector.h" | ||
#include "mediapipe/tasks/cc/text/language_detector/language_detector.h" | ||
|
||
namespace mediapipe::tasks::c::components::containers { | ||
|
||
void CppConvertToLanguageDetectionResult( | ||
const mediapipe::tasks::text::language_detector::LanguageDetectorResult& in, | ||
LanguageDetectorResult* out) { | ||
out->predictions_count = in.size(); | ||
out->predictions = | ||
out->predictions_count | ||
? new LanguageDetectorPrediction[out->predictions_count] | ||
: nullptr; | ||
|
||
for (uint32_t i = 0; i < out->predictions_count; ++i) { | ||
auto language_detection_prediction_in = in[i]; | ||
auto& language_detection_prediction_out = out->predictions[i]; | ||
language_detection_prediction_out.probability = | ||
language_detection_prediction_in.probability; | ||
language_detection_prediction_out.language_code = | ||
strdup(language_detection_prediction_in.language_code.c_str()); | ||
} | ||
} | ||
|
||
// Releases the memory owned by `in`: each prediction's language code (with
// free(), matching the strdup() used during conversion) and the predictions
// array itself (with delete[]). Afterwards `in` holds no predictions, so
// calling this function again on the same struct does nothing.
void CppCloseLanguageDetectionResult(LanguageDetectorResult* in) {
  for (uint32_t i = 0; i < in->predictions_count; ++i) {
    // Take a reference so the stored pointer itself is cleared; a by-value
    // copy of the prediction would only reset the copy.
    auto& prediction = in->predictions[i];
    free(prediction.language_code);
    prediction.language_code = nullptr;
  }
  delete[] in->predictions;
  in->predictions = nullptr;
  // Keep the count in sync with the (now null) array so that a repeated close
  // never indexes into it.
  in->predictions_count = 0;
}
|
||
} // namespace mediapipe::tasks::c::components::containers |
32 changes: 32 additions & 0 deletions
32
mediapipe/tasks/c/components/containers/language_detection_result_converter.h
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,32 @@ | ||
/* Copyright 2023 The MediaPipe Authors. | ||
Licensed under the Apache License, Version 2.0 (the "License"); | ||
you may not use this file except in compliance with the License. | ||
You may obtain a copy of the License at | ||
http://www.apache.org/licenses/LICENSE-2.0 | ||
Unless required by applicable law or agreed to in writing, software | ||
distributed under the License is distributed on an "AS IS" BASIS, | ||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
See the License for the specific language governing permissions and | ||
limitations under the License. | ||
==============================================================================*/ | ||
|
||
#ifndef MEDIAPIPE_TASKS_C_COMPONENTS_CONTAINERS_LANGUAGE_DETECTION_RESULT_CONVERTER_H_ | ||
#define MEDIAPIPE_TASKS_C_COMPONENTS_CONTAINERS_LANGUAGE_DETECTION_RESULT_CONVERTER_H_ | ||
|
||
#include "mediapipe/tasks/c/text/language_detector/language_detector.h" | ||
#include "mediapipe/tasks/cc/text/language_detector/language_detector.h" | ||
|
||
namespace mediapipe::tasks::c::components::containers { | ||
|
||
// Fills the C struct `out` from the C++ language detector result `in`. | ||
// The predictions stored in `out` are heap-allocated; release them with | ||
// CppCloseLanguageDetectionResult(). | ||
void CppConvertToLanguageDetectionResult( | ||
const mediapipe::tasks::text::language_detector::LanguageDetectorResult& in, | ||
LanguageDetectorResult* out); | ||
|
||
// Frees the predictions held by `in` and resets `in->predictions` to nullptr. | ||
void CppCloseLanguageDetectionResult(LanguageDetectorResult* in); | ||
|
||
} // namespace mediapipe::tasks::c::components::containers | ||
|
||
#endif // MEDIAPIPE_TASKS_C_COMPONENTS_CONTAINERS_LANGUAGE_DETECTION_RESULT_CONVERTER_H_ |
54 changes: 54 additions & 0 deletions
54
mediapipe/tasks/c/components/containers/language_detection_result_converter_test.cc
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,54 @@ | ||
/* Copyright 2023 The MediaPipe Authors. | ||
Licensed under the Apache License, Version 2.0 (the "License"); | ||
you may not use this file except in compliance with the License. | ||
You may obtain a copy of the License at | ||
http://www.apache.org/licenses/LICENSE-2.0 | ||
Unless required by applicable law or agreed to in writing, software | ||
distributed under the License is distributed on an "AS IS" BASIS, | ||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
See the License for the specific language governing permissions and | ||
limitations under the License. | ||
==============================================================================*/ | ||
|
||
#include "mediapipe/tasks/c/components/containers/language_detection_result_converter.h" | ||
|
||
#include "mediapipe/framework/port/gtest.h" | ||
#include "mediapipe/tasks/c/text/language_detector/language_detector.h" | ||
#include "mediapipe/tasks/cc/text/language_detector/language_detector.h" | ||
|
||
namespace mediapipe::tasks::c::components::containers { | ||
|
||
// Verifies that a C++ result with two predictions is converted into a C result
// carrying the same count, language codes and probabilities.
TEST(LanguageDetectionResultConverterTest,
     ConvertsLanguageDetectionResultCustomResult) {
  mediapipe::tasks::text::language_detector::LanguageDetectorResult
      cpp_detector_result = {{/* language_code= */ "fr",
                              /* probability= */ 0.5},
                             {/* language_code= */ "en",
                              /* probability= */ 0.5}};

  LanguageDetectorResult c_detector_result;
  CppConvertToLanguageDetectionResult(cpp_detector_result, &c_detector_result);
  // Fatal assertion: the checks below index into the array.
  ASSERT_NE(c_detector_result.predictions, nullptr);
  EXPECT_EQ(c_detector_result.predictions_count, 2);
  // Compare the string contents. EXPECT_NE/EXPECT_EQ on a char* and a literal
  // would compare addresses, which says nothing about the converted text.
  EXPECT_STREQ(c_detector_result.predictions[0].language_code, "fr");
  EXPECT_EQ(c_detector_result.predictions[0].probability, 0.5);
  EXPECT_STREQ(c_detector_result.predictions[1].language_code, "en");
  EXPECT_EQ(c_detector_result.predictions[1].probability, 0.5);

  CppCloseLanguageDetectionResult(&c_detector_result);
}
|
||
// Checks that closing a converted result resets its predictions pointer.
TEST(LanguageDetectionResultConverterTest, FreesMemory) {
  using CppResult =
      mediapipe::tasks::text::language_detector::LanguageDetectorResult;
  CppResult cpp_input = {{"fr", 0.5}};

  // After conversion the C struct must own a predictions array.
  LanguageDetectorResult c_output;
  CppConvertToLanguageDetectionResult(cpp_input, &c_output);
  EXPECT_NE(c_output.predictions, nullptr);

  // Closing the result must leave the pointer null.
  CppCloseLanguageDetectionResult(&c_output);
  EXPECT_EQ(c_output.predictions, nullptr);
}
|
||
} // namespace mediapipe::tasks::c::components::containers |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,93 @@ | ||
# Copyright 2023 The MediaPipe Authors. | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
|
||
package(default_visibility = ["//mediapipe/tasks:internal"]) | ||
|
||
licenses(["notice"]) | ||
|
||
# Implementation of the language detector C API (language_detector.cc) together | ||
# with its header. Publicly visible, unlike the package default. | ||
cc_library( | ||
name = "language_detector_lib", | ||
srcs = ["language_detector.cc"], | ||
hdrs = ["language_detector.h"], | ||
visibility = ["//visibility:public"], | ||
deps = [ | ||
"//mediapipe/tasks/c/components/containers:language_detection_result_converter", | ||
"//mediapipe/tasks/c/components/processors:classifier_options", | ||
"//mediapipe/tasks/c/components/processors:classifier_options_converter", | ||
"//mediapipe/tasks/c/core:base_options", | ||
"//mediapipe/tasks/c/core:base_options_converter", | ||
"//mediapipe/tasks/cc/text/language_detector", | ||
"@com_google_absl//absl/log:absl_log", | ||
"@com_google_absl//absl/status", | ||
], | ||
# NOTE(review): presumably set so the exported C symbols are kept in the | ||
# shared-library targets, which reach this code only through deps - confirm. | ||
alwayslink = 1, | ||
) | ||
|
||
# Shared library (.so) packaging of :language_detector_lib. It has no srcs of | ||
# its own; all code comes from deps. Example build command: | ||
# bazel build -c opt --linkopt -s --strip always --define MEDIAPIPE_DISABLE_GPU=1 \ | ||
# //mediapipe/tasks/c/text/language_detector:liblanguage_detector.so | ||
cc_binary( | ||
name = "liblanguage_detector.so", | ||
# NOTE(review): -fvisibility=hidden is normally a compile option; confirm it | ||
# has the intended effect when passed through linkopts. | ||
linkopts = [ | ||
"-Wl,-soname=liblanguage_detector.so", | ||
"-fvisibility=hidden", | ||
], | ||
linkshared = True, | ||
tags = [ | ||
"manual", | ||
"nobuilder", | ||
"notap", | ||
], | ||
deps = [":language_detector_lib"], | ||
) | ||
|
||
# Shared library (.dylib) packaging of :language_detector_lib. It has no srcs | ||
# of its own; all code comes from deps. Example build command: | ||
# bazel build --config darwin_arm64 -c opt --strip always --define MEDIAPIPE_DISABLE_GPU=1 \ | ||
# //mediapipe/tasks/c/text/language_detector:liblanguage_detector.dylib | ||
cc_binary( | ||
name = "liblanguage_detector.dylib", | ||
# NOTE(review): -fvisibility=hidden is normally a compile option; confirm it | ||
# has the intended effect when passed through linkopts. | ||
linkopts = [ | ||
"-Wl,-install_name,liblanguage_detector.dylib", | ||
"-fvisibility=hidden", | ||
], | ||
linkshared = True, | ||
tags = [ | ||
"manual", | ||
"nobuilder", | ||
"notap", | ||
], | ||
deps = [":language_detector_lib"], | ||
) | ||
|
||
# Header-only target: exposes language_detector.h without the implementation | ||
# in language_detector.cc (this rule lists no srcs). | ||
cc_library( | ||
name = "language_detector", | ||
hdrs = ["language_detector.h"], | ||
deps = [ | ||
"//mediapipe/tasks/c/components/processors:classifier_options", | ||
"//mediapipe/tasks/c/core:base_options", | ||
], | ||
) | ||
|
||
# Test for the language detector C API, built against :language_detector_lib. | ||
# Its runtime data comes from //mediapipe/tasks/testdata/text:language_detector. | ||
cc_test( | ||
name = "language_detector_test", | ||
srcs = ["language_detector_test.cc"], | ||
data = ["//mediapipe/tasks/testdata/text:language_detector"], | ||
linkstatic = 1, | ||
deps = [ | ||
":language_detector_lib", | ||
"//mediapipe/framework/deps:file_path", | ||
"//mediapipe/framework/port:gtest", | ||
"@com_google_absl//absl/flags:flag", | ||
"@com_google_absl//absl/strings", | ||
"@com_google_googletest//:gtest_main", | ||
], | ||
) | ||
124 changes: 124 additions & 0 deletions
124
mediapipe/tasks/c/text/language_detector/language_detector.cc
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,124 @@ | ||
/* Copyright 2023 The MediaPipe Authors. | ||
Licensed under the Apache License, Version 2.0 (the "License"); | ||
you may not use this file except in compliance with the License. | ||
You may obtain a copy of the License at | ||
http://www.apache.org/licenses/LICENSE-2.0 | ||
Unless required by applicable law or agreed to in writing, software | ||
distributed under the License is distributed on an "AS IS" BASIS, | ||
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
See the License for the specific language governing permissions and | ||
limitations under the License. | ||
==============================================================================*/ | ||
|
||
#include "mediapipe/tasks/c/text/language_detector/language_detector.h" | ||
|
||
#include <memory> | ||
#include <utility> | ||
|
||
#include "absl/log/absl_log.h" | ||
#include "absl/status/status.h" | ||
#include "mediapipe/tasks/c/components/containers/language_detection_result_converter.h" | ||
#include "mediapipe/tasks/c/components/processors/classifier_options_converter.h" | ||
#include "mediapipe/tasks/c/core/base_options_converter.h" | ||
#include "mediapipe/tasks/cc/text/language_detector/language_detector.h" | ||
|
||
namespace mediapipe::tasks::c::text::language_detector { | ||
|
||
namespace { | ||
|
||
using ::mediapipe::tasks::c::components::containers:: | ||
CppCloseLanguageDetectionResult; | ||
using ::mediapipe::tasks::c::components::containers:: | ||
CppConvertToLanguageDetectionResult; | ||
using ::mediapipe::tasks::c::components::processors:: | ||
CppConvertToClassifierOptions; | ||
using ::mediapipe::tasks::c::core::CppConvertToBaseOptions; | ||
using ::mediapipe::tasks::text::language_detector::LanguageDetector; | ||
|
||
// Reports `status` to a C caller and returns its raw status code.
//
// When `error_msg` is non-null, `*error_msg` receives a strdup()-allocated
// copy of the status text (presumably to be released with free() by the
// caller - confirm against the public header).
int CppProcessError(absl::Status status, char** error_msg) {
  if (error_msg != nullptr) {
    const auto message = status.ToString();
    *error_msg = strdup(message.c_str());
  }
  return status.raw_code();
}
|
||
} // namespace | ||
|
||
// Builds a C++ LanguageDetector from the C `options`.
//
// Returns a raw pointer released from the created detector, or nullptr when
// creation fails. On failure the error is logged and, if `error_msg` is
// non-null, reported through it by CppProcessError().
LanguageDetector* CppLanguageDetectorCreate(
    const LanguageDetectorOptions& options, char** error_msg) {
  using CppOptions =
      ::mediapipe::tasks::text::language_detector::LanguageDetectorOptions;

  // Translate the C option structs into their C++ counterparts.
  auto converted_options = std::make_unique<CppOptions>();
  CppConvertToBaseOptions(options.base_options,
                          &converted_options->base_options);
  CppConvertToClassifierOptions(options.classifier_options,
                                &converted_options->classifier_options);

  auto created = LanguageDetector::Create(std::move(converted_options));
  if (created.ok()) {
    // Hand the raw pointer to the caller.
    return created->release();
  }

  ABSL_LOG(ERROR) << "Failed to create LanguageDetector: "
                  << created.status();
  CppProcessError(created.status(), error_msg);
  return nullptr;
}
|
||
int CppLanguageDetectorDetect(void* detector, const char* utf8_str, | ||
LanguageDetectorResult* result, | ||
char** error_msg) { | ||
auto cpp_detector = static_cast<LanguageDetector*>(detector); | ||
auto cpp_result = cpp_detector->Detect(utf8_str); | ||
if (!cpp_result.ok()) { | ||
ABSL_LOG(ERROR) << "Language Detection failed: " << cpp_result.status(); | ||
return CppProcessError(cpp_result.status(), error_msg); | ||
} | ||
|
||
CppConvertToLanguageDetectionResult(*cpp_result, result); | ||
return 0; | ||
} | ||
|
||
// Releases the memory held by `result` by forwarding to | ||
// CppCloseLanguageDetectionResult(). | ||
void CppLanguageDetectorCloseResult(LanguageDetectorResult* result) { | ||
CppCloseLanguageDetectionResult(result); | ||
} | ||
|
||
int CppLanguageDetectorClose(void* detector, char** error_msg) { | ||
auto cpp_detector = static_cast<LanguageDetector*>(detector); | ||
auto result = cpp_detector->Close(); | ||
if (!result.ok()) { | ||
ABSL_LOG(ERROR) << "Failed to close LanguageDetector: " << result; | ||
return CppProcessError(result, error_msg); | ||
} | ||
delete cpp_detector; | ||
return 0; | ||
} | ||
|
||
} // namespace mediapipe::tasks::c::text::language_detector | ||
|
||
extern "C" { | ||
|
||
void* language_detector_create(struct LanguageDetectorOptions* options, | ||
char** error_msg) { | ||
return mediapipe::tasks::c::text::language_detector:: | ||
CppLanguageDetectorCreate(*options, error_msg); | ||
} | ||
|
||
int language_detector_detect(void* detector, const char* utf8_str, | ||
LanguageDetectorResult* result, char** error_msg) { | ||
return mediapipe::tasks::c::text::language_detector:: | ||
CppLanguageDetectorDetect(detector, utf8_str, result, error_msg); | ||
} | ||
|
||
void language_detector_close_result(LanguageDetectorResult* result) { | ||
mediapipe::tasks::c::text::language_detector::CppLanguageDetectorCloseResult( | ||
result); | ||
} | ||
|
||
int language_detector_close(void* detector, char** error_ms) { | ||
return mediapipe::tasks::c::text::language_detector::CppLanguageDetectorClose( | ||
detector, error_ms); | ||
} | ||
|
||
} // extern "C" |
Oops, something went wrong.