Andrew Moylan | ff6be51 | 2018-07-03 11:05:01 +1000 | [diff] [blame] | 1 | // Copyright 2018 The Chromium OS Authors. All rights reserved. |
| 2 | // Use of this source code is governed by a BSD-style license that can be |
| 3 | // found in the LICENSE file. |
| 4 | |
| 5 | #include "ml/machine_learning_service_impl.h" |
alanlxl | cb1f856 | 2018-11-01 15:16:11 +1100 | [diff] [blame] | 6 | #include "ml/request_metrics.h" |
Andrew Moylan | ff6be51 | 2018-07-03 11:05:01 +1000 | [diff] [blame] | 7 | |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 8 | #include <memory> |
Andrew Moylan | ff6be51 | 2018-07-03 11:05:01 +1000 | [diff] [blame] | 9 | #include <utility> |
| 10 | |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 11 | #include <base/bind.h> |
| 12 | #include <base/bind_helpers.h> |
Honglin Yu | f33dce3 | 2019-12-05 15:10:39 +1100 | [diff] [blame] | 13 | #include <base/files/file.h> |
| 14 | #include <base/files/file_util.h> |
Michael Martis | 8783c8e | 2019-06-26 17:30:54 +1000 | [diff] [blame] | 15 | #include <tensorflow/lite/model.h> |
Honglin Yu | f33dce3 | 2019-12-05 15:10:39 +1100 | [diff] [blame] | 16 | #include <unicode/putil.h> |
| 17 | #include <unicode/udata.h> |
| 18 | #include <utils/memory/mmap.h> |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 19 | |
charleszhao | 17777f9 | 2020-04-23 12:53:11 +1000 | [diff] [blame] | 20 | #include "ml/handwriting.h" |
charleszhao | 05c5a4a | 2020-06-09 16:49:54 +1000 | [diff] [blame] | 21 | #include "ml/handwriting_path.h" |
charleszhao | 17777f9 | 2020-04-23 12:53:11 +1000 | [diff] [blame] | 22 | #include "ml/handwriting_recognizer_impl.h" |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 23 | #include "ml/model_impl.h" |
charleszhao | 17777f9 | 2020-04-23 12:53:11 +1000 | [diff] [blame] | 24 | #include "ml/mojom/handwriting_recognizer.mojom.h" |
Hidehiko Abe | aa488c3 | 2018-08-31 23:49:41 +0900 | [diff] [blame] | 25 | #include "ml/mojom/model.mojom.h" |
Honglin Yu | f33dce3 | 2019-12-05 15:10:39 +1100 | [diff] [blame] | 26 | #include "ml/text_classifier_impl.h" |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 27 | |
Andrew Moylan | ff6be51 | 2018-07-03 11:05:01 +1000 | [diff] [blame] | 28 | namespace ml { |
| 29 | |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 30 | namespace { |
| 31 | |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 32 | using ::chromeos::machine_learning::mojom::BuiltinModelId; |
| 33 | using ::chromeos::machine_learning::mojom::BuiltinModelSpecPtr; |
| 34 | using ::chromeos::machine_learning::mojom::FlatBufferModelSpecPtr; |
charleszhao | 17777f9 | 2020-04-23 12:53:11 +1000 | [diff] [blame] | 35 | using ::chromeos::machine_learning::mojom::HandwritingRecognizerRequest; |
charleszhao | 05c5a4a | 2020-06-09 16:49:54 +1000 | [diff] [blame] | 36 | using ::chromeos::machine_learning::mojom::HandwritingRecognizerSpec; |
| 37 | using ::chromeos::machine_learning::mojom::HandwritingRecognizerSpecPtr; |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 38 | using ::chromeos::machine_learning::mojom::LoadModelResult; |
Andrew Moylan | 2fb80af | 2020-07-08 10:52:08 +1000 | [diff] [blame] | 39 | using ::chromeos::machine_learning::mojom::MachineLearningServiceRequest; |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 40 | using ::chromeos::machine_learning::mojom::ModelRequest; |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 41 | |
// Default model directory; the two-argument constructor passes it on as
// `model_dir`.
constexpr char kSystemModelDir[] = "/opt/google/chrome/ml_models/";
// Base name for UMA metrics related to model loading (`LoadBuiltinModel`,
// `LoadFlatBufferModel`, `LoadTextClassifier` or `LoadHandwritingModel`).
constexpr char kMetricsRequestName[] = "LoadModelResult";

// Default file name of the text classifier model. It is appended to the model
// directory by `LoadTextClassifier`.
constexpr char kTextClassifierModelFile[] =
    "mlservice-model-text_classifier_en-v706.fb";

// Path of the ICU data file that `InitIcuIfNeeded` reads into memory.
constexpr char kIcuDataFilePath[] = "/opt/google/chrome/icudtl.dat";
| 51 | |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 52 | } // namespace |
| 53 | |
Andrew Moylan | ff6be51 | 2018-07-03 11:05:01 +1000 | [diff] [blame] | 54 | MachineLearningServiceImpl::MachineLearningServiceImpl( |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 55 | mojo::ScopedMessagePipeHandle pipe, |
| 56 | base::Closure connection_error_handler, |
| 57 | const std::string& model_dir) |
Honglin Yu | f33dce3 | 2019-12-05 15:10:39 +1100 | [diff] [blame] | 58 | : icu_data_(nullptr), |
| 59 | text_classifier_model_filename_(kTextClassifierModelFile), |
| 60 | builtin_model_metadata_(GetBuiltinModelMetadata()), |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 61 | model_dir_(model_dir), |
hscham | 6886765 | 2020-01-06 11:40:47 +0900 | [diff] [blame] | 62 | binding_(this, |
| 63 | mojo::InterfaceRequest< |
| 64 | chromeos::machine_learning::mojom::MachineLearningService>( |
Honglin Yu | f33dce3 | 2019-12-05 15:10:39 +1100 | [diff] [blame] | 65 | std::move(pipe))) { |
Andrew Moylan | ff6be51 | 2018-07-03 11:05:01 +1000 | [diff] [blame] | 66 | binding_.set_connection_error_handler(std::move(connection_error_handler)); |
| 67 | } |
| 68 | |
Michael Martis | a74af93 | 2018-08-13 16:52:36 +1000 | [diff] [blame] | 69 | MachineLearningServiceImpl::MachineLearningServiceImpl( |
| 70 | mojo::ScopedMessagePipeHandle pipe, base::Closure connection_error_handler) |
| 71 | : MachineLearningServiceImpl(std::move(pipe), |
| 72 | std::move(connection_error_handler), |
| 73 | kSystemModelDir) {} |
| 74 | |
Honglin Yu | f33dce3 | 2019-12-05 15:10:39 +1100 | [diff] [blame] | 75 | void MachineLearningServiceImpl::SetTextClassifierModelFilenameForTesting( |
| 76 | const std::string& filename) { |
| 77 | text_classifier_model_filename_ = filename; |
| 78 | } |
| 79 | |
Andrew Moylan | 2fb80af | 2020-07-08 10:52:08 +1000 | [diff] [blame] | 80 | void MachineLearningServiceImpl::Clone(MachineLearningServiceRequest request) { |
| 81 | clone_bindings_.AddBinding(this, std::move(request)); |
| 82 | } |
| 83 | |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 84 | void MachineLearningServiceImpl::LoadBuiltinModel( |
| 85 | BuiltinModelSpecPtr spec, |
| 86 | ModelRequest request, |
Qijiang Fan | 5d381a0 | 2020-04-19 23:42:37 +0900 | [diff] [blame] | 87 | LoadBuiltinModelCallback callback) { |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 88 | // Unsupported models do not have metadata entries. |
| 89 | const auto metadata_lookup = builtin_model_metadata_.find(spec->id); |
| 90 | if (metadata_lookup == builtin_model_metadata_.end()) { |
Honglin Yu | a81145a | 2019-09-23 15:20:13 +1000 | [diff] [blame] | 91 | LOG(WARNING) << "LoadBuiltinModel requested for unsupported model ID " |
| 92 | << spec->id << "."; |
Qijiang Fan | 5d381a0 | 2020-04-19 23:42:37 +0900 | [diff] [blame] | 93 | std::move(callback).Run(LoadModelResult::MODEL_SPEC_ERROR); |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 94 | RecordModelSpecificationErrorEvent(); |
| 95 | return; |
| 96 | } |
| 97 | |
| 98 | const BuiltinModelMetadata& metadata = metadata_lookup->second; |
| 99 | |
| 100 | DCHECK(!metadata.metrics_model_name.empty()); |
| 101 | |
| 102 | RequestMetrics<LoadModelResult> request_metrics(metadata.metrics_model_name, |
| 103 | kMetricsRequestName); |
| 104 | request_metrics.StartRecordingPerformanceMetrics(); |
| 105 | |
| 106 | // Attempt to load model. |
| 107 | const std::string model_path = model_dir_ + metadata.model_file; |
| 108 | std::unique_ptr<tflite::FlatBufferModel> model = |
| 109 | tflite::FlatBufferModel::BuildFromFile(model_path.c_str()); |
| 110 | if (model == nullptr) { |
| 111 | LOG(ERROR) << "Failed to load model file '" << model_path << "'."; |
Qijiang Fan | 5d381a0 | 2020-04-19 23:42:37 +0900 | [diff] [blame] | 112 | std::move(callback).Run(LoadModelResult::LOAD_MODEL_ERROR); |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 113 | request_metrics.RecordRequestEvent(LoadModelResult::LOAD_MODEL_ERROR); |
| 114 | return; |
| 115 | } |
| 116 | |
Honglin Yu | c0cef10 | 2020-01-17 15:26:01 +1100 | [diff] [blame] | 117 | ModelImpl::Create(metadata.required_inputs, metadata.required_outputs, |
| 118 | std::move(model), std::move(request), |
| 119 | metadata.metrics_model_name); |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 120 | |
Qijiang Fan | 5d381a0 | 2020-04-19 23:42:37 +0900 | [diff] [blame] | 121 | std::move(callback).Run(LoadModelResult::OK); |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 122 | |
| 123 | request_metrics.FinishRecordingPerformanceMetrics(); |
| 124 | request_metrics.RecordRequestEvent(LoadModelResult::OK); |
| 125 | } |
| 126 | |
| 127 | void MachineLearningServiceImpl::LoadFlatBufferModel( |
| 128 | FlatBufferModelSpecPtr spec, |
| 129 | ModelRequest request, |
Qijiang Fan | 5d381a0 | 2020-04-19 23:42:37 +0900 | [diff] [blame] | 130 | LoadFlatBufferModelCallback callback) { |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 131 | DCHECK(!spec->metrics_model_name.empty()); |
| 132 | |
| 133 | RequestMetrics<LoadModelResult> request_metrics(spec->metrics_model_name, |
| 134 | kMetricsRequestName); |
| 135 | request_metrics.StartRecordingPerformanceMetrics(); |
| 136 | |
Andrew Moylan | 79b34a4 | 2020-07-08 11:13:11 +1000 | [diff] [blame] | 137 | // Take the ownership of the content of `model_string` because `ModelImpl` has |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 138 | // to hold the memory. |
| 139 | auto model_string_impl = |
| 140 | std::make_unique<std::string>(std::move(spec->model_string)); |
| 141 | |
| 142 | std::unique_ptr<tflite::FlatBufferModel> model = |
| 143 | tflite::FlatBufferModel::BuildFromBuffer(model_string_impl->c_str(), |
| 144 | model_string_impl->length()); |
| 145 | if (model == nullptr) { |
| 146 | LOG(ERROR) << "Failed to load model string of metric name: " |
| 147 | << spec->metrics_model_name << "'."; |
Qijiang Fan | 5d381a0 | 2020-04-19 23:42:37 +0900 | [diff] [blame] | 148 | std::move(callback).Run(LoadModelResult::LOAD_MODEL_ERROR); |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 149 | request_metrics.RecordRequestEvent(LoadModelResult::LOAD_MODEL_ERROR); |
| 150 | return; |
| 151 | } |
| 152 | |
Honglin Yu | c0cef10 | 2020-01-17 15:26:01 +1100 | [diff] [blame] | 153 | ModelImpl::Create( |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 154 | std::map<std::string, int>(spec->inputs.begin(), spec->inputs.end()), |
| 155 | std::map<std::string, int>(spec->outputs.begin(), spec->outputs.end()), |
| 156 | std::move(model), std::move(model_string_impl), std::move(request), |
| 157 | spec->metrics_model_name); |
| 158 | |
Qijiang Fan | 5d381a0 | 2020-04-19 23:42:37 +0900 | [diff] [blame] | 159 | std::move(callback).Run(LoadModelResult::OK); |
Honglin Yu | 0ed7235 | 2019-08-27 17:42:01 +1000 | [diff] [blame] | 160 | |
| 161 | request_metrics.FinishRecordingPerformanceMetrics(); |
| 162 | request_metrics.RecordRequestEvent(LoadModelResult::OK); |
| 163 | } |
| 164 | |
Honglin Yu | f33dce3 | 2019-12-05 15:10:39 +1100 | [diff] [blame] | 165 | void MachineLearningServiceImpl::LoadTextClassifier( |
| 166 | chromeos::machine_learning::mojom::TextClassifierRequest request, |
| 167 | LoadTextClassifierCallback callback) { |
| 168 | RequestMetrics<LoadModelResult> request_metrics("TextClassifier", |
| 169 | kMetricsRequestName); |
| 170 | request_metrics.StartRecordingPerformanceMetrics(); |
| 171 | |
| 172 | // Attempt to load model. |
| 173 | std::string model_path = model_dir_ + text_classifier_model_filename_; |
| 174 | auto scoped_mmap = |
| 175 | std::make_unique<libtextclassifier3::ScopedMmap>(model_path); |
| 176 | if (!scoped_mmap->handle().ok()) { |
| 177 | LOG(ERROR) << "Failed to load the text classifier model file '" |
| 178 | << model_path << "'."; |
| 179 | std::move(callback).Run(LoadModelResult::LOAD_MODEL_ERROR); |
| 180 | request_metrics.RecordRequestEvent(LoadModelResult::LOAD_MODEL_ERROR); |
| 181 | return; |
| 182 | } |
| 183 | |
| 184 | // Create the TextClassifier. |
| 185 | if (!TextClassifierImpl::Create(&scoped_mmap, std::move(request))) { |
| 186 | LOG(ERROR) << "Failed to create TextClassifierImpl object."; |
| 187 | std::move(callback).Run(LoadModelResult::LOAD_MODEL_ERROR); |
| 188 | request_metrics.RecordRequestEvent(LoadModelResult::LOAD_MODEL_ERROR); |
| 189 | return; |
| 190 | } |
| 191 | |
| 192 | // initialize the icu library. |
| 193 | InitIcuIfNeeded(); |
| 194 | |
| 195 | std::move(callback).Run(LoadModelResult::OK); |
| 196 | |
| 197 | request_metrics.FinishRecordingPerformanceMetrics(); |
| 198 | request_metrics.RecordRequestEvent(LoadModelResult::OK); |
| 199 | } |
| 200 | |
charleszhao | 17777f9 | 2020-04-23 12:53:11 +1000 | [diff] [blame] | 201 | void MachineLearningServiceImpl::LoadHandwritingModel( |
| 202 | HandwritingRecognizerRequest request, |
| 203 | LoadHandwritingModelCallback callback) { |
charleszhao | 05c5a4a | 2020-06-09 16:49:54 +1000 | [diff] [blame] | 204 | // Use english as default language. |
| 205 | LoadHandwritingModelWithSpec(HandwritingRecognizerSpec::New("en"), |
| 206 | std::move(request), std::move(callback)); |
| 207 | } |
| 208 | |
| 209 | void MachineLearningServiceImpl::LoadHandwritingModelWithSpec( |
| 210 | HandwritingRecognizerSpecPtr spec, |
| 211 | HandwritingRecognizerRequest request, |
| 212 | LoadHandwritingModelCallback callback) { |
charleszhao | 17777f9 | 2020-04-23 12:53:11 +1000 | [diff] [blame] | 213 | RequestMetrics<LoadModelResult> request_metrics("HandwritingModel", |
| 214 | kMetricsRequestName); |
| 215 | request_metrics.StartRecordingPerformanceMetrics(); |
| 216 | |
| 217 | // Load HandwritingLibrary. |
| 218 | auto* const hwr_library = ml::HandwritingLibrary::GetInstance(); |
| 219 | |
| 220 | if (hwr_library->GetStatus() == |
| 221 | ml::HandwritingLibrary::Status::kNotSupported) { |
| 222 | LOG(ERROR) << "Initialize ml::HandwritingLibrary with error " |
| 223 | << static_cast<int>(hwr_library->GetStatus()); |
| 224 | |
| 225 | std::move(callback).Run(LoadModelResult::FEATURE_NOT_SUPPORTED_ERROR); |
| 226 | request_metrics.RecordRequestEvent( |
| 227 | LoadModelResult::FEATURE_NOT_SUPPORTED_ERROR); |
| 228 | return; |
| 229 | } |
| 230 | |
| 231 | if (hwr_library->GetStatus() != ml::HandwritingLibrary::Status::kOk) { |
| 232 | LOG(ERROR) << "Initialize ml::HandwritingLibrary with error " |
| 233 | << static_cast<int>(hwr_library->GetStatus()); |
| 234 | |
| 235 | std::move(callback).Run(LoadModelResult::LOAD_MODEL_ERROR); |
| 236 | request_metrics.RecordRequestEvent(LoadModelResult::LOAD_MODEL_ERROR); |
| 237 | return; |
| 238 | } |
| 239 | |
charleszhao | 05c5a4a | 2020-06-09 16:49:54 +1000 | [diff] [blame] | 240 | if (!GetModelPaths(spec.Clone()).has_value()) { |
| 241 | LOG(ERROR) << "LoadHandwritingRecognizer is not called because language " |
| 242 | "code is not supported."; |
| 243 | |
| 244 | std::move(callback).Run(LoadModelResult::LANGUAGE_NOT_SUPPORTED_ERROR); |
| 245 | request_metrics.RecordRequestEvent( |
| 246 | LoadModelResult::LANGUAGE_NOT_SUPPORTED_ERROR); |
| 247 | return; |
| 248 | } |
| 249 | |
charleszhao | 17777f9 | 2020-04-23 12:53:11 +1000 | [diff] [blame] | 250 | // Create HandwritingRecognizer. |
charleszhao | 05c5a4a | 2020-06-09 16:49:54 +1000 | [diff] [blame] | 251 | if (!HandwritingRecognizerImpl::Create(std::move(spec), std::move(request))) { |
charleszhao | 17777f9 | 2020-04-23 12:53:11 +1000 | [diff] [blame] | 252 | LOG(ERROR) << "LoadHandwritingRecognizer returned false."; |
| 253 | std::move(callback).Run(LoadModelResult::LOAD_MODEL_ERROR); |
| 254 | request_metrics.RecordRequestEvent(LoadModelResult::LOAD_MODEL_ERROR); |
| 255 | return; |
| 256 | } |
| 257 | |
| 258 | std::move(callback).Run(LoadModelResult::OK); |
| 259 | request_metrics.FinishRecordingPerformanceMetrics(); |
| 260 | request_metrics.RecordRequestEvent(LoadModelResult::OK); |
| 261 | } |
| 262 | |
Honglin Yu | f33dce3 | 2019-12-05 15:10:39 +1100 | [diff] [blame] | 263 | void MachineLearningServiceImpl::InitIcuIfNeeded() { |
| 264 | if (icu_data_ == nullptr) { |
| 265 | // Need to load the data file again. |
| 266 | int64_t file_size; |
| 267 | const base::FilePath icu_data_file_path(kIcuDataFilePath); |
| 268 | CHECK(base::GetFileSize(icu_data_file_path, &file_size)); |
| 269 | icu_data_ = new char[file_size]; |
| 270 | CHECK(base::ReadFile(icu_data_file_path, icu_data_, |
| 271 | static_cast<int>(file_size)) == file_size); |
| 272 | // Init the Icu library. |
| 273 | UErrorCode err = U_ZERO_ERROR; |
| 274 | udata_setCommonData(reinterpret_cast<void*>(icu_data_), &err); |
| 275 | DCHECK(err == U_ZERO_ERROR); |
| 276 | // Never try to load Icu data from files. |
| 277 | udata_setFileAccess(UDATA_ONLY_PACKAGES, &err); |
| 278 | } |
| 279 | } |
| 280 | |
Andrew Moylan | ff6be51 | 2018-07-03 11:05:01 +1000 | [diff] [blame] | 281 | } // namespace ml |