You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
189 lines
6.3 KiB
189 lines
6.3 KiB
/*
 * Copyright (C) 2018 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
|
|
|
|
#include "lang_id/lang-id_jni.h"
|
|
|
|
#include <jni.h>
|
|
|
|
#include <type_traits>
|
|
#include <vector>
|
|
|
|
#include "lang_id/lang-id-wrapper.h"
|
|
#include "utils/base/logging.h"
|
|
#include "utils/java/jni-helper.h"
|
|
#include "lang_id/fb_model/lang-id-from-fb.h"
|
|
#include "lang_id/lang-id.h"
|
|
|
|
using libtextclassifier3::JniHelper;
|
|
using libtextclassifier3::JStringToUtf8String;
|
|
using libtextclassifier3::ScopedLocalRef;
|
|
using libtextclassifier3::StatusOr;
|
|
using libtextclassifier3::mobile::lang_id::GetLangIdFromFlatbufferFile;
|
|
using libtextclassifier3::mobile::lang_id::GetLangIdFromFlatbufferFileDescriptor;
|
|
using libtextclassifier3::mobile::lang_id::LangId;
|
|
using libtextclassifier3::mobile::lang_id::LangIdResult;
|
|
|
|
namespace {
|
|
|
|
// Builds a Java object array holding one "$LanguageResult" instance per entry
// of `lang_id_predictions`.
//
// Each (language, score) pair is passed to the LanguageResult constructor with
// signature (String, float), and the resulting object is stored at the same
// position it had in the input vector.
//
// NOTE(review): the TC3_ASSIGN_OR_RETURN steps presumably return early with
// the failing status when a JNI helper call fails -- confirm against the
// macro definition.
StatusOr<ScopedLocalRef<jobjectArray>> LangIdResultToJObjectArray(
    JNIEnv* env,
    const std::vector<std::pair<std::string, float>>& lang_id_predictions) {
  // Resolve the Java result class and its constructor once, up front.
  TC3_ASSIGN_OR_RETURN(
      const ScopedLocalRef<jclass> language_result_class,
      JniHelper::FindClass(
          env, TC3_PACKAGE_PATH TC3_LANG_ID_CLASS_NAME_STR "$LanguageResult"));
  TC3_ASSIGN_OR_RETURN(
      const jmethodID language_result_ctor,
      JniHelper::GetMethodID(env, language_result_class.get(), "<init>",
                             "(Ljava/lang/String;F)V"));

  // Allocate the output array with one (initially null) slot per prediction.
  TC3_ASSIGN_OR_RETURN(
      ScopedLocalRef<jobjectArray> java_results,
      JniHelper::NewObjectArray(env, lang_id_predictions.size(),
                                language_result_class.get(), nullptr));

  int slot = 0;
  for (const std::pair<std::string, float>& prediction : lang_id_predictions) {
    TC3_ASSIGN_OR_RETURN(
        const ScopedLocalRef<jstring> java_language,
        JniHelper::NewStringUTF(env, prediction.first.c_str()));
    TC3_ASSIGN_OR_RETURN(
        const ScopedLocalRef<jobject> java_result,
        JniHelper::NewObject(env, language_result_class.get(),
                             language_result_ctor, java_language.get(),
                             static_cast<jfloat>(prediction.second)));
    // NOTE(review): whatever SetObjectArrayElement returns is not inspected
    // here -- confirm whether a failure should abort the conversion.
    JniHelper::SetObjectArrayElement(env, java_results.get(), slot,
                                     java_result.get());
    ++slot;
  }
  return java_results;
}
|
|
|
|
float GetNoiseThreshold(const LangId& model) {
|
|
return model.GetFloatProperty("text_classifier_langid_noise_threshold", -1.0);
|
|
}
|
|
} // namespace
|
|
|
|
// Creates a native LangId from the flatbuffer model behind file descriptor
// `fd` and hands it to Java as an opaque jlong handle.
//
// Returns a null handle when no usable model could be created. On success the
// LangId is released from its unique_ptr and returned as a raw pointer cast to
// jlong; nativeClose() in this file deletes such a handle.
TC3_JNI_METHOD(jlong, TC3_LANG_ID_CLASS_NAME, nativeNew)
(JNIEnv* env, jobject clazz, jint fd) {
  std::unique_ptr<LangId> lang_id = GetLangIdFromFlatbufferFileDescriptor(fd);
  // Check for an empty unique_ptr before touching the model: calling
  // is_valid() through a null pointer would be undefined behavior.
  if (lang_id == nullptr || !lang_id->is_valid()) {
    return reinterpret_cast<jlong>(nullptr);
  }
  return reinterpret_cast<jlong>(lang_id.release());
}
|
|
|
|
// Creates a native LangId from the flatbuffer model file named by the Java
// string `path` and hands it to Java as an opaque jlong handle.
//
// Returns a null handle when no usable model could be created. On success the
// LangId is released from its unique_ptr and returned as a raw pointer cast to
// jlong; nativeClose() in this file deletes such a handle.
TC3_JNI_METHOD(jlong, TC3_LANG_ID_CLASS_NAME, nativeNewFromPath)
(JNIEnv* env, jobject clazz, jstring path) {
  // NOTE(review): TC3_ASSIGN_OR_RETURN_0 presumably makes this function return
  // 0 when the string conversion fails -- confirm against the macro.
  TC3_ASSIGN_OR_RETURN_0(const std::string path_str,
                         JStringToUtf8String(env, path));
  std::unique_ptr<LangId> lang_id = GetLangIdFromFlatbufferFile(path_str);
  // Check for an empty unique_ptr before touching the model: calling
  // is_valid() through a null pointer would be undefined behavior.
  if (lang_id == nullptr || !lang_id->is_valid()) {
    return reinterpret_cast<jlong>(nullptr);
  }
  return reinterpret_cast<jlong>(lang_id.release());
}
|
|
|
|
// Creates a native LangId from a flatbuffer model read through file descriptor
// `fd`, forwarding `offset` and `size` to the loader, and hands it to Java as
// an opaque jlong handle.
//
// Returns a null handle when no usable model could be created. On success the
// LangId is released from its unique_ptr and returned as a raw pointer cast to
// jlong; nativeClose() in this file deletes such a handle.
TC3_JNI_METHOD(jlong, TC3_LANG_ID_CLASS_NAME, nativeNewWithOffset)
(JNIEnv* env, jobject clazz, jint fd, jlong offset, jlong size) {
  std::unique_ptr<LangId> lang_id =
      GetLangIdFromFlatbufferFileDescriptor(fd, offset, size);
  // Check for an empty unique_ptr before touching the model: calling
  // is_valid() through a null pointer would be undefined behavior.
  if (lang_id == nullptr || !lang_id->is_valid()) {
    return reinterpret_cast<jlong>(nullptr);
  }
  return reinterpret_cast<jlong>(lang_id.release());
}
|
|
|
|
// Runs language identification on the Java string `text` using the LangId
// behind the handle `ptr`, and returns the predictions as a Java array built
// by LangIdResultToJObjectArray().
//
// Returns nullptr when `ptr` is a null handle.
// NOTE(review): the TC3_ASSIGN_OR_RETURN_NULL steps presumably return nullptr
// when the string conversion or the array construction fails -- confirm
// against the macro.
TC3_JNI_METHOD(jobjectArray, TC3_LANG_ID_CLASS_NAME, nativeDetectLanguages)
(JNIEnv* env, jobject thiz, jlong ptr, jstring text) {
  LangId* const lang_id = reinterpret_cast<LangId*>(ptr);
  if (lang_id == nullptr) {
    return nullptr;
  }

  TC3_ASSIGN_OR_RETURN_NULL(const std::string utf8_text,
                            JStringToUtf8String(env, text));

  // (language, score) pairs produced by the model for the input text.
  const std::vector<std::pair<std::string, float>>& predictions =
      libtextclassifier3::langid::GetPredictions(lang_id, utf8_text);

  TC3_ASSIGN_OR_RETURN_NULL(
      ScopedLocalRef<jobjectArray> java_predictions,
      LangIdResultToJObjectArray(env, predictions));

  // Give up the scoped reference so the array can be returned to the caller.
  return java_predictions.release();
}
|
|
|
|
TC3_JNI_METHOD(void, TC3_LANG_ID_CLASS_NAME, nativeClose)
|
|
(JNIEnv* env, jobject thiz, jlong ptr) {
|
|
if (!ptr) {
|
|
TC3_LOG(ERROR) << "Trying to close null LangId.";
|
|
return;
|
|
}
|
|
LangId* model = reinterpret_cast<LangId*>(ptr);
|
|
delete model;
|
|
}
|
|
|
|
// Returns the model version reported by the LangId behind the handle `ptr`,
// or -1 when `ptr` is a null handle.
TC3_JNI_METHOD(jint, TC3_LANG_ID_CLASS_NAME, nativeGetVersion)
(JNIEnv* env, jobject thiz, jlong ptr) {
  if (ptr == 0) {
    return -1;
  }
  LangId* const lang_id = reinterpret_cast<LangId*>(ptr);
  return lang_id->GetModelVersion();
}
|
|
|
|
// Loads the flatbuffer model behind file descriptor `fd` just long enough to
// read its version.
//
// Returns the model version, or -1 when no usable model could be created. The
// temporary LangId is owned by a local unique_ptr and is destroyed when this
// function returns.
TC3_JNI_METHOD(jint, TC3_LANG_ID_CLASS_NAME, nativeGetVersionFromFd)
(JNIEnv* env, jobject clazz, jint fd) {
  std::unique_ptr<LangId> lang_id = GetLangIdFromFlatbufferFileDescriptor(fd);
  // Check for an empty unique_ptr before touching the model: calling
  // is_valid() through a null pointer would be undefined behavior.
  if (lang_id == nullptr || !lang_id->is_valid()) {
    return -1;
  }
  return lang_id->GetModelVersion();
}
|
|
|
|
// Returns the "text_classifier_langid_threshold" float property of the LangId
// behind the handle `ptr`. Yields -1.0 when `ptr` is a null handle; -1.0 is
// also the default argument passed to the property lookup.
TC3_JNI_METHOD(jfloat, TC3_LANG_ID_CLASS_NAME, nativeGetLangIdThreshold)
(JNIEnv* env, jobject thizz, jlong ptr) {
  if (ptr == 0) {
    return -1.0;
  }
  LangId* const lang_id = reinterpret_cast<LangId*>(ptr);
  return lang_id->GetFloatProperty("text_classifier_langid_threshold", -1.0);
}
|
|
|
|
// Returns the noise threshold of the LangId behind the handle `ptr`, as
// computed by GetNoiseThreshold(), or -1.0 when `ptr` is a null handle.
TC3_JNI_METHOD(jfloat, TC3_LANG_ID_CLASS_NAME, nativeGetLangIdNoiseThreshold)
(JNIEnv* env, jobject thizz, jlong ptr) {
  if (ptr == 0) {
    return -1.0;
  }
  LangId* const lang_id = reinterpret_cast<LangId*>(ptr);
  return GetNoiseThreshold(*lang_id);
}
|
|
|
|
// Returns the "min_text_size_in_bytes" property of the LangId behind the
// handle `ptr`, or 0 when `ptr` is a null handle.
//
// The property is read through GetFloatProperty() with a default argument of
// 0 and then converted to jint.
TC3_JNI_METHOD(jint, TC3_LANG_ID_CLASS_NAME, nativeGetMinTextSizeInBytes)
(JNIEnv* env, jobject thizz, jlong ptr) {
  if (ptr == 0) {
    return 0;
  }
  LangId* const lang_id = reinterpret_cast<LangId*>(ptr);
  // Same conversion the return statement would otherwise perform implicitly.
  return static_cast<jint>(
      lang_id->GetFloatProperty("min_text_size_in_bytes", 0));
}
|
|
|
|
// Loads a flatbuffer model through file descriptor `fd`, forwarding `offset`
// and `size` to the loader, just long enough to read its version.
//
// Returns the model version, or -1 when no usable model could be created. The
// temporary LangId is owned by a local unique_ptr and is destroyed when this
// function returns.
TC3_JNI_METHOD(jint, TC3_LANG_ID_CLASS_NAME, nativeGetVersionWithOffset)
(JNIEnv* env, jobject clazz, jint fd, jlong offset, jlong size) {
  std::unique_ptr<LangId> lang_id =
      GetLangIdFromFlatbufferFileDescriptor(fd, offset, size);
  // Check for an empty unique_ptr before touching the model: calling
  // is_valid() through a null pointer would be undefined behavior.
  if (lang_id == nullptr || !lang_id->is_valid()) {
    return -1;
  }
  return lang_id->GetModelVersion();
}
|