File: language_detection_model.cc

package info (click to toggle)
chromium 141.0.7390.107-1~deb12u1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm-proposed-updates
  • size: 6,254,812 kB
  • sloc: cpp: 35,264,957; ansic: 7,169,920; javascript: 4,250,185; python: 1,460,636; asm: 950,788; xml: 751,751; pascal: 187,972; sh: 89,459; perl: 88,691; objc: 79,953; sql: 53,924; cs: 44,622; fortran: 24,137; makefile: 22,319; tcl: 15,277; php: 14,018; yacc: 8,995; ruby: 7,553; awk: 3,720; lisp: 3,096; lex: 1,330; ada: 727; jsp: 228; sed: 36
file content (82 lines) | stat: -rw-r--r-- 2,922 bytes parent folder | download | duplicates (4)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
// Copyright 2024 The Chromium Authors
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.

#include "third_party/blink/renderer/platform/language_detection/language_detection_model.h"

#include <map>
#include <string>
#include <string_view>

#include "base/functional/bind.h"
#include "base/functional/callback.h"
#include "base/types/expected.h"
#include "components/language_detection/content/common/language_detection.mojom-blink.h"
#include "components/language_detection/content/renderer/language_detection_model_manager.h"
#include "components/language_detection/core/language_detection_model.h"
#include "mojo/public/cpp/bindings/remote.h"
#include "third_party/blink/public/common/thread_safe_browser_interface_broker_proxy.h"
#include "third_party/blink/renderer/platform/heap/persistent.h"
#include "third_party/blink/renderer/platform/wtf/functional.h"

namespace blink {

// Hands `model_file` to the underlying language detection model for an
// asynchronous update and reports the outcome through `callback`.
//
// `callback` receives this object when the underlying model reports itself
// available after the update; otherwise it receives
// DetectLanguageError::kUnavailable. The receiver is bound via
// WrapWeakPersistent(), so the completion handler checks it for null before
// touching it.
void LanguageDetectionModel::LoadModelFile(
    base::File model_file,
    CreateLanguageDetectionModelCallback callback) {
  language_detection_model_.UpdateWithFileAsync(
      std::move(model_file),
      blink::BindOnce(
          [](LanguageDetectionModel* self,
             CreateLanguageDetectionModelCallback done) {
            // Success requires both a non-null receiver and an available
            // model.
            const bool usable =
                self && self->language_detection_model_.IsAvailable();
            if (usable) {
              std::move(done).Run(self);
              return;
            }
            std::move(done).Run(
                base::unexpected(DetectLanguageError::kUnavailable));
          },
          WrapWeakPersistent(this), std::move(callback)));
}

// Tracing hook. This implementation reports nothing to `visitor`.
void LanguageDetectionModel::Trace(Visitor* visitor) const {
  // Intentionally empty.
}

// Schedules language detection for `text` on `task_runner`.
//
// If the underlying model is not available, `on_complete` is run right away
// (synchronously, from this call) with DetectLanguageError::kUnavailable and
// nothing is posted. Otherwise DetectLanguageImpl() is posted to
// `task_runner`, with this object bound via WrapPersistent().
void LanguageDetectionModel::DetectLanguage(
    scoped_refptr<base::SequencedTaskRunner>& task_runner,
    const String& text,
    DetectLanguageCallback on_complete) {
  if (language_detection_model_.IsAvailable()) {
    auto detect_task =
        blink::BindOnce(&LanguageDetectionModel::DetectLanguageImpl,
                        WrapPersistent(this), text, std::move(on_complete));
    task_runner->PostTask(FROM_HERE, std::move(detect_task));
    return;
  }

  // No usable model: fail immediately instead of posting a task.
  std::move(on_complete)
      .Run(base::unexpected(blink::DetectLanguageError::kUnavailable));
}

// Runs the model over `text` and passes the resulting predictions to
// `on_complete`.
//
// Each entry returned by PredictWithScan() is converted into a
// LanguagePrediction built from its `language` and `score` fields, in the
// order the model returned them.
void LanguageDetectionModel::DetectLanguageImpl(
    const String& text,
    DetectLanguageCallback on_complete) {
  // Work on a local copy so the caller's string is left untouched, and force
  // the 16-bit representation so that View16() can be used below.
  String text_16 = text;
  text_16.Ensure16Bit();
  const auto score_by_language =
      language_detection_model_.PredictWithScan(text_16.View16());

  Vector<LanguagePrediction> predictions;
  predictions.reserve(static_cast<wtf_size_t>(score_by_language.size()));
  for (const auto& prediction : score_by_language) {
    predictions.emplace_back(prediction.language, prediction.score);
  }
  // `predictions` is not used after this point, so move it into the callback
  // argument rather than copying the whole vector.
  std::move(on_complete).Run(std::move(predictions));
}

// Returns the size reported by the underlying model, or 0 when the model is
// not available.
int64_t LanguageDetectionModel::GetModelSize() const {
  return language_detection_model_.IsAvailable()
             ? language_detection_model_.GetModelSize()
             : 0;
}

}  // namespace blink