// Copyright 2014 The Chromium Authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
// Every field in this file carries an explicit `optional`/`repeated` label,
// i.e. proto2 style. Declaring the syntax makes that explicit instead of
// relying on the compiler's default.
syntax = "proto2";

package dom_distiller.proto;

// Generate code against the lite protobuf runtime.
option optimize_for = LITE_RUNTIME;

// Java code is generated into this package, wrapped in a single outer class.
option java_package = "com.dom_distiller.proto";
option java_outer_classname = "DomDistillerProtos";
// Content produced by distillation; referenced from
// DomDistillerResult.distilled_content.
message DistilledContent {
  // The content as a string.
  // NOTE(review): presumably serialized HTML, going by the field name —
  // confirm against the producer.
  optional string html = 1;
}
// Links between the pages of a multi-page document; referenced from
// DomDistillerResult.pagination_info.
// NOTE(review): the three fields are presumably URLs — confirm the expected
// format (absolute vs. relative) against the producer.
message PaginationInfo {
  // The page that follows the current one.
  optional string next_page = 1;

  // The page that precedes the current one.
  optional string prev_page = 2;

  // The canonical page for the document.
  optional string canonical_page = 3;
}
// Article-level metadata; embedded in MarkupInfo.article.
// NOTE(review): the *_time fields are plain strings and their format is not
// specified in this file — confirm with the producer before parsing them.
message MarkupArticle {
  // When the article was published.
  optional string published_time = 1;

  // When the article was last modified.
  optional string modified_time = 2;

  // When the article expires.
  optional string expiration_time = 3;

  // The section the article belongs to.
  optional string section = 4;

  // The article's authors, one entry per author.
  repeated string authors = 5;
}
// Metadata describing a single image; used as the element type of
// MarkupInfo.images.
message MarkupImage {
  // Location of the image.
  optional string url = 1;

  // Secure counterpart of `url`.
  // NOTE(review): presumably an HTTPS location for the same image — confirm.
  optional string secure_url = 2;

  // Type of the image.
  // NOTE(review): presumably a MIME type — confirm.
  optional string type = 3;

  // Caption accompanying the image.
  optional string caption = 4;

  // Image dimensions.
  // NOTE(review): units are not stated in this file; presumably pixels.
  optional int32 width = 5;
  optional int32 height = 6;
}
// Document-level metadata; referenced from DomDistillerResult.markup_info.
// NOTE(review): presumably populated from structured markup found in the
// page — confirm which markup sources feed these fields.
message MarkupInfo {
  // Title of the document.
  optional string title = 1;

  // Type of the document.
  // NOTE(review): the set of allowed values is not defined in this file.
  optional string type = 2;

  // Location of the document.
  optional string url = 3;

  // Description of the document.
  optional string description = 4;

  // Publisher of the document.
  optional string publisher = 5;

  // Copyright statement for the document.
  optional string copyright = 6;

  // Author of the document.
  optional string author = 7;

  // Article-specific metadata.
  optional MarkupArticle article = 8;

  // Images associated with the document.
  repeated MarkupImage images = 9;
}
// Aggregate result message: bundles the title, the distilled content,
// pagination links, image URLs and markup metadata for one document.
message DomDistillerResult {
  // Title of the document.
  optional string title = 1;

  // The distilled content.
  optional DistilledContent distilled_content = 2;

  // Links to neighbouring pages.
  optional PaginationInfo pagination_info = 3;

  // URLs of images.
  // NOTE(review): presumably the images referenced by the distilled
  // content — confirm.
  repeated string image_urls = 4;

  // Metadata about the document.
  optional MarkupInfo markup_info = 5;
}
// Options controlling how distillation runs.
message DomDistillerOptions {
  // Whether to extract only the text (or to include the containing html).
  optional bool extract_text_only = 1;

  // How much debug output to dump to window.console. Each level includes
  // everything logged by the level below it:
  //   (1): Text Node data for each stage of processing
  //   (2): (1) and some node visibility information
  //   (3): (2) and extracted paging information
  // NOTE(review): no entry for level 0 is listed here; presumably it means
  // no debug output — confirm.
  optional int32 debug_level = 2;
}