• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright (C) 2010 The Android Open Source Project
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *      http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13  * See the License for the specific language governing permissions and
14  * limitations under the License.
15  */
16 
17 package com.android.browser;
18 
19 import android.net.Uri;
20 import android.util.Patterns;
21 import android.webkit.URLUtil;
22 
23 import java.util.regex.Matcher;
24 import java.util.regex.Pattern;
25 
26 /**
27  * Utility methods for Url manipulation
28  */
29 public class UrlUtils {
30 
31     static final Pattern ACCEPTED_URI_SCHEMA = Pattern.compile(
32             "(?i)" + // switch on case insensitive matching
33             "(" +    // begin group for schema
34             "(?:http|https|file):\\/\\/" +
35             "|(?:data|about|javascript):" +
36             "|(?:.*:.*@)" +
37             ")" +
38             "(.*)" );
39 
40     // Google search
41     private final static String QUICKSEARCH_G = "http://www.google.com/m?q=%s";
42     private final static String QUERY_PLACE_HOLDER = "%s";
43 
44     // Regular expression to strip http:// and optionally
45     // the trailing slash
46     private static final Pattern STRIP_URL_PATTERN =
47             Pattern.compile("^http://(.*?)/?$");
48 
UrlUtils()49     private UrlUtils() { /* cannot be instantiated */ }
50 
51     /**
52      * Strips the provided url of preceding "http://" and any trailing "/". Does not
53      * strip "https://". If the provided string cannot be stripped, the original string
54      * is returned.
55      *
56      * TODO: Put this in TextUtils to be used by other packages doing something similar.
57      *
58      * @param url a url to strip, like "http://www.google.com/"
59      * @return a stripped url like "www.google.com", or the original string if it could
60      *         not be stripped
61      */
stripUrl(String url)62     public static String stripUrl(String url) {
63         if (url == null) return null;
64         Matcher m = STRIP_URL_PATTERN.matcher(url);
65         if (m.matches()) {
66             return m.group(1);
67         } else {
68             return url;
69         }
70     }
71 
smartUrlFilter(Uri inUri)72     protected static String smartUrlFilter(Uri inUri) {
73         if (inUri != null) {
74             return smartUrlFilter(inUri.toString());
75         }
76         return null;
77     }
78 
79     /**
80      * Attempts to determine whether user input is a URL or search
81      * terms.  Anything with a space is passed to search.
82      *
83      * Converts to lowercase any mistakenly uppercased schema (i.e.,
84      * "Http://" converts to "http://"
85      *
86      * @return Original or modified URL
87      *
88      */
smartUrlFilter(String url)89     public static String smartUrlFilter(String url) {
90         return smartUrlFilter(url, true);
91     }
92 
93     /**
94      * Attempts to determine whether user input is a URL or search
95      * terms.  Anything with a space is passed to search if canBeSearch is true.
96      *
97      * Converts to lowercase any mistakenly uppercased schema (i.e.,
98      * "Http://" converts to "http://"
99      *
100      * @param canBeSearch If true, will return a search url if it isn't a valid
101      *                    URL. If false, invalid URLs will return null
102      * @return Original or modified URL
103      *
104      */
smartUrlFilter(String url, boolean canBeSearch)105     public static String smartUrlFilter(String url, boolean canBeSearch) {
106         String inUrl = url.trim();
107         boolean hasSpace = inUrl.indexOf(' ') != -1;
108 
109         Matcher matcher = ACCEPTED_URI_SCHEMA.matcher(inUrl);
110         if (matcher.matches()) {
111             // force scheme to lowercase
112             String scheme = matcher.group(1);
113             String lcScheme = scheme.toLowerCase();
114             if (!lcScheme.equals(scheme)) {
115                 inUrl = lcScheme + matcher.group(2);
116             }
117             if (hasSpace && Patterns.WEB_URL.matcher(inUrl).matches()) {
118                 inUrl = inUrl.replace(" ", "%20");
119             }
120             return inUrl;
121         }
122         if (!hasSpace) {
123             if (Patterns.WEB_URL.matcher(inUrl).matches()) {
124                 return URLUtil.guessUrl(inUrl);
125             }
126         }
127         if (canBeSearch) {
128             return URLUtil.composeSearchUrl(inUrl,
129                     QUICKSEARCH_G, QUERY_PLACE_HOLDER);
130         }
131         return null;
132     }
133 
fixUrl(String inUrl)134     /* package */ static String fixUrl(String inUrl) {
135         // FIXME: Converting the url to lower case
136         // duplicates functionality in smartUrlFilter().
137         // However, changing all current callers of fixUrl to
138         // call smartUrlFilter in addition may have unwanted
139         // consequences, and is deferred for now.
140         int colon = inUrl.indexOf(':');
141         boolean allLower = true;
142         for (int index = 0; index < colon; index++) {
143             char ch = inUrl.charAt(index);
144             if (!Character.isLetter(ch)) {
145                 break;
146             }
147             allLower &= Character.isLowerCase(ch);
148             if (index == colon - 1 && !allLower) {
149                 inUrl = inUrl.substring(0, colon).toLowerCase()
150                         + inUrl.substring(colon);
151             }
152         }
153         if (inUrl.startsWith("http://") || inUrl.startsWith("https://"))
154             return inUrl;
155         if (inUrl.startsWith("http:") ||
156                 inUrl.startsWith("https:")) {
157             if (inUrl.startsWith("http:/") || inUrl.startsWith("https:/")) {
158                 inUrl = inUrl.replaceFirst("/", "//");
159             } else inUrl = inUrl.replaceFirst(":", "://");
160         }
161         return inUrl;
162     }
163 
164     // Returns the filtered URL. Cannot return null, but can return an empty string
filteredUrl(String inUrl)165     /* package */ static String filteredUrl(String inUrl) {
166         if (inUrl == null) {
167             return "";
168         }
169         if (inUrl.startsWith("content:")
170                 || inUrl.startsWith("browser:")) {
171             return "";
172         }
173         return inUrl;
174     }
175 
176 }
177