15821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)// Copyright (c) 2012 The Chromium Authors. All rights reserved.
25821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)// Use of this source code is governed by a BSD-style license that can be
35821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)// found in the LICENSE file.
45821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
55821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)#ifndef CONTENT_RENDERER_ANDROID_CONTENT_DETECTOR_H_
65821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)#define CONTENT_RENDERER_ANDROID_CONTENT_DETECTOR_H_
75821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
87d4cd473f85ac64c3747c96c277f9e506a0d2246Torne (Richard Coles)#include "third_party/WebKit/public/web/WebRange.h"
97dbb3d5cf0c15f500944d211057644d6a2f37371Ben Murdoch#include "url/gurl.h"
105821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
11f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)namespace blink {
125821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)class WebHitTestResult;
135821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)}
145821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
155821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)namespace content {
165821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
175821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)// Base class for text-based content detectors.
185821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)class ContentDetector {
195821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) public:
205821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Holds the content detection results.
215821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  struct Result {
225821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    Result();
23f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    Result(const blink::WebRange& content_boundaries,
245821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)           const std::string& text,
255821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)           const GURL& intent_url);
265821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    ~Result();
275821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
285821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    bool valid;
29f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    blink::WebRange content_boundaries;
305821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    std::string text; // Processed text of the content.
315821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)    GURL intent_url; // URL of the intent that should process this content.
325821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  };
335821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
345821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  virtual ~ContentDetector() {}
355821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
365821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Returns a WebKit range delimiting the contents found around the tapped
375821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // position. If no content is found a null range will be returned.
38f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  Result FindTappedContent(const blink::WebHitTestResult& hit_test);
395821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
405821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles) protected:
415821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  ContentDetector() {}
425821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
435821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Parses the input string defined by the begin/end iterators returning true
445821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // if the desired content is found. The start and end positions relative to
455821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // the input iterators are returned in start_pos and end_pos.
465821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // The end position is assumed to be non-inclusive.
47a3f6a49ab37290eeeb8db0f41ec0f1cb74a68be7Torne (Richard Coles)  virtual bool FindContent(const base::string16::const_iterator& begin,
48a3f6a49ab37290eeeb8db0f41ec0f1cb74a68be7Torne (Richard Coles)                           const base::string16::const_iterator& end,
495821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                           size_t* start_pos,
505821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                           size_t* end_pos,
515821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                           std::string* content_text) = 0;
525821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
535821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Returns the intent URL that should process the content, if any.
545821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  virtual GURL GetIntentURL(const std::string& content_text) = 0;
555821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
565821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // Returns the maximum length of text to be extracted around the tapped
575821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  // position in order to search for content.
585821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  virtual size_t GetMaximumContentLength() = 0;
595821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
60f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  blink::WebRange FindContentRange(const blink::WebHitTestResult& hit_test,
615821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)                                    std::string* content_text);
625821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
635821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)  DISALLOW_COPY_AND_ASSIGN(ContentDetector);
645821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)};
655821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
665821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)}  // namespace content
675821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)
685821806d5e7f356e8fa4b058a389a808ea183019Torne (Richard Coles)#endif  // CONTENT_RENDERER_ANDROID_CONTENT_DETECTOR_H_
69