1 // Copyright 2015 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file.
5 #include "components/dom_distiller/content/distillable_page_utils.h"
8 #include "base/location.h"
9 #include "base/single_thread_task_runner.h"
10 #include "base/strings/utf_string_conversions.h"
11 #include "base/thread_task_runner_handle.h"
12 #include "base/values.h"
13 #include "components/dom_distiller/content/distiller_javascript_utils.h"
14 #include "components/dom_distiller/core/distillable_page_detector.h"
15 #include "components/dom_distiller/core/experiments.h"
16 #include "components/dom_distiller/core/page_features.h"
17 #include "content/public/browser/render_frame_host.h"
18 #include "grit/components_resources.h"
19 #include "ui/base/resource/resource_bundle.h"
21 namespace dom_distiller
{
23 void OnOGArticleJsResult(base::Callback
<void(bool)> callback
,
24 const base::Value
* result
) {
27 result
->GetAsBoolean(&success
);
29 callback
.Run(success
);
32 void OnExtractFeaturesJsResult(const DistillablePageDetector
* detector
,
33 base::Callback
<void(bool)> callback
,
34 const base::Value
* result
) {
35 callback
.Run(detector
->Classify(CalculateDerivedFeaturesFromJSON(result
)));
39 void IsOpenGraphArticle(content::WebContents
* web_contents
,
40 base::Callback
<void(bool)> callback
) {
41 content::RenderFrameHost
* main_frame
= web_contents
->GetMainFrame();
43 base::ThreadTaskRunnerHandle::Get()->PostTask(FROM_HERE
,
44 base::Bind(callback
, false));
47 std::string og_article_js
= ResourceBundle::GetSharedInstance()
48 .GetRawDataResource(IDR_IS_DISTILLABLE_JS
)
50 RunIsolatedJavaScript(main_frame
, og_article_js
,
51 base::Bind(OnOGArticleJsResult
, callback
));
54 void IsDistillablePage(content::WebContents
* web_contents
,
55 bool is_mobile_optimized
,
56 base::Callback
<void(bool)> callback
) {
57 switch (GetDistillerHeuristicsType()) {
58 case DistillerHeuristicsType::ALWAYS_TRUE
:
59 base::ThreadTaskRunnerHandle::Get()->PostTask(FROM_HERE
,
60 base::Bind(callback
, true));
62 case DistillerHeuristicsType::OG_ARTICLE
:
63 IsOpenGraphArticle(web_contents
, callback
);
65 case DistillerHeuristicsType::ADABOOST_MODEL
:
66 // The adaboost model is only applied to non-mobile pages.
67 if (is_mobile_optimized
) {
68 base::ThreadTaskRunnerHandle::Get()->PostTask(
69 FROM_HERE
, base::Bind(callback
, false));
72 IsDistillablePageForDetector(
73 web_contents
, DistillablePageDetector::GetDefault(), callback
);
75 case DistillerHeuristicsType::NONE
:
77 base::ThreadTaskRunnerHandle::Get()->PostTask(
78 FROM_HERE
, base::Bind(callback
, false));
83 void IsDistillablePageForDetector(content::WebContents
* web_contents
,
84 const DistillablePageDetector
* detector
,
85 base::Callback
<void(bool)> callback
) {
86 content::RenderFrameHost
* main_frame
= web_contents
->GetMainFrame();
88 base::ThreadTaskRunnerHandle::Get()->PostTask(FROM_HERE
,
89 base::Bind(callback
, false));
92 std::string extract_features_js
=
93 ResourceBundle::GetSharedInstance()
94 .GetRawDataResource(IDR_EXTRACT_PAGE_FEATURES_JS
)
96 RunIsolatedJavaScript(
97 main_frame
, extract_features_js
,
98 base::Bind(OnExtractFeaturesJsResult
, detector
, callback
));
101 } // namespace dom_distiller