Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(176)

Unified Diff: components/test/data/dom_distiller/derived_features.json

Issue 1042053003: Add calculation of derived features for distillable page model (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: rebase Created 5 years, 9 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
« no previous file with comments | « components/test/data/dom_distiller/core_features.json ('k') | no next file » | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
Index: components/test/data/dom_distiller/derived_features.json
diff --git a/components/test/data/dom_distiller/derived_features.json b/components/test/data/dom_distiller/derived_features.json
new file mode 100644
index 0000000000000000000000000000000000000000..40071b330b9705a0d962698b457773ea58f89ac0
--- /dev/null
+++ b/components/test/data/dom_distiller/derived_features.json
@@ -0,0 +1,194 @@
+[
+ {
+ "url": "https://zh-tw.facebook.com/permalink.php",
+ "index": 0,
+ "features": [
+ "opengraph",
+ false,
+ "forum",
+ false,
+ "index",
+ false,
+ "view",
+ false,
+ "asp",
+ false,
+ "phpbb",
+ false,
+ "php",
+ true,
+ "pathlength",
+ 14,
+ "domain",
+ false,
+ "pathcomponents",
+ 1,
+ "slugdetector",
+ 1,
+ "pathnumbers",
+ 0,
+ "lastSegmentLength",
+ 13,
+ "formcount",
+ 1,
+ "anchorcount",
+ 26,
+ "elementcount",
+ 120,
+ "anchorratio",
+ 0.21666666666666667,
+ "innertextlength",
+ 492,
+ "textcontentlength",
+ 12832,
+ "innerhtmllength",
+ 19715,
+ "innertextlengthratio",
+ 0.024955617550088766,
+ "textcontentlengthratio",
+ 0.6508749682982501,
+ "innertexttextcontentlengthratio",
+ 0.03834164588528678,
+ "innertextwordcount",
+ 5,
+ "textcontentwordcount",
+ 1470,
+ "innerhtmlwordcount",
+ 2313,
+ "innertextwordcountratio",
+ 0.00216169476869866,
+ "textcontentwordcountratio",
+ 0.6355382619974059,
+ "innertexttextcontentwordcountratio",
+ 0.003401360544217687
+ ]
+ },
+ {
+ "url": "https://zb.getitfree.us/myaccount/survey.html",
+ "index": 1,
+ "features": [
+ "opengraph",
+ false,
+ "forum",
+ false,
+ "index",
+ false,
+ "view",
+ false,
+ "asp",
+ false,
+ "phpbb",
+ false,
+ "php",
+ false,
+ "pathlength",
+ 22,
+ "domain",
+ false,
+ "pathcomponents",
+ 2,
+ "slugdetector",
+ 1,
+ "pathnumbers",
+ 0,
+ "lastSegmentLength",
+ 11,
+ "formcount",
+ 0,
+ "anchorcount",
+ 5,
+ "elementcount",
+ 92,
+ "anchorratio",
+ 0.05434782608695652,
+ "innertextlength",
+ 1137,
+ "textcontentlength",
+ 25037,
+ "innerhtmllength",
+ 33602,
+ "innertextlengthratio",
+ 0.03383727159097673,
+ "textcontentlengthratio",
+ 0.7451044580679721,
+ "innertexttextcontentlengthratio",
+ 0.045412789072173186,
+ "innertextwordcount",
+ 181,
+ "textcontentwordcount",
+ 2811,
+ "innerhtmlwordcount",
+ 3926,
+ "innertextwordcountratio",
+ 0.04610290371879776,
+ "textcontentwordcountratio",
+ 0.7159959246051961,
+ "innertexttextcontentwordcountratio",
+ 0.06438989683386695
+ ]
+ },
+ {
+ "url": "https://yande.re/pool",
+ "index": 2,
+ "features": [
+ "opengraph",
+ false,
+ "forum",
+ false,
+ "index",
+ false,
+ "view",
+ false,
+ "asp",
+ false,
+ "phpbb",
+ false,
+ "php",
+ false,
+ "pathlength",
+ 5,
+ "domain",
+ false,
+ "pathcomponents",
+ 1,
+ "slugdetector",
+ 0,
+ "pathnumbers",
+ 0,
+ "lastSegmentLength",
+ 4,
+ "formcount",
+ 10,
+ "anchorcount",
+ 112,
+ "elementcount",
+ 492,
+ "anchorratio",
+ 0.22764227642276422,
+ "innertextlength",
+ 1676,
+ "textcontentlength",
+ 41089,
+ "innerhtmllength",
+ 56900,
+ "innertextlengthratio",
+ 0.02945518453427065,
+ "textcontentlengthratio",
+ 0.7221265377855888,
+ "innertexttextcontentlengthratio",
+ 0.04078950570712356,
+ "innertextwordcount",
+ 303,
+ "textcontentwordcount",
+ 3874,
+ "innerhtmlwordcount",
+ 6502,
+ "innertextwordcountratio",
+ 0.04660104583205168,
+ "textcontentwordcountratio",
+ 0.5958166717932943,
+ "innertexttextcontentwordcountratio",
+ 0.07821373257614868
+ ]
+ }
+]
« no previous file with comments | « components/test/data/dom_distiller/core_features.json ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698