| 1 | |
|
| 2 | |
|
| 3 | |
|
| 4 | |
|
| 5 | |
|
| 6 | |
|
| 7 | |
|
| 8 | |
|
| 9 | |
|
| 10 | |
|
| 11 | |
|
| 12 | |
|
| 13 | |
|
| 14 | |
|
| 15 | |
|
| 16 | |
|
| 17 | |
|
| 18 | |
|
| 19 | |
|
| 20 | |
|
| 21 | |
|
| 22 | |
|
| 23 | |
|
| 24 | |
|
| 25 | |
|
| 26 | |
|
| 27 | |
|
| 28 | |
|
| 29 | |
|
| 30 | |
|
| 31 | |
|
| 32 | |
package net.sourceforge.pebble.logging; |
| 33 | |
|
| 34 | |
import java.net.URLDecoder; |
| 35 | |
import java.util.regex.Matcher; |
| 36 | |
import java.util.regex.Pattern; |
| 37 | |
|
| 38 | |
|
| 39 | |
|
| 40 | |
|
| 41 | |
|
| 42 | |
|
| 43 | |
|
| 44 | |
public class Referer extends CountedUrl { |
| 45 | |
|
| 46 | |
|
| 47 | 4 | private static final Pattern GOOGLE_QUERY_STRING_PATTERN = Pattern.compile("[?&]q=[^&]+&*"); |
| 48 | |
|
| 49 | |
|
| 50 | |
private static final String GOOGLE_PREFIX = "http://www.google."; |
| 51 | |
|
| 52 | |
|
| 53 | 4 | private static final Pattern GOOGLE_IMAGES_QUERY_STRING_PATTERN = Pattern.compile("[?&]prev=[^&]+&*"); |
| 54 | |
|
| 55 | |
|
| 56 | |
private static final String GOOGLE_IMAGES_PREFIX = "http://images.google."; |
| 57 | |
|
| 58 | |
|
| 59 | 4 | private static final Pattern YAHOO_QUERY_STRING_PATTERN = Pattern.compile("[?&]p=[^&]+&*"); |
| 60 | |
|
| 61 | |
|
| 62 | |
private static final String YAHOO_PREFIX = "http://search.yahoo."; |
| 63 | |
|
| 64 | |
|
| 65 | 4 | private static final Pattern MSN_QUERY_STRING_PATTERN = Pattern.compile("[?&]q=[^&]+&*"); |
| 66 | |
|
| 67 | |
|
| 68 | |
private static final String MSN_PREFIX = "http://search.msn."; |
| 69 | |
|
| 70 | |
|
| 71 | |
private static final String MSN_BETA_PREFIX = "http://beta.search.msn."; |
| 72 | |
|
| 73 | |
|
| 74 | 4 | private static final Pattern BING_QUERY_STRING_PATTERN = Pattern.compile("[?&]q=[^&]+&*"); |
| 75 | |
|
| 76 | |
|
| 77 | |
private static final String BING_PREFIX = "http://www.bing.com"; |
| 78 | |
|
| 79 | |
|
| 80 | 4 | private static final Pattern JAVABLOGS_WELCOME_PATTERN = Pattern.compile(".*javablogs.com/Welcome.*"); |
| 81 | |
|
| 82 | |
|
| 83 | 4 | private static final Pattern JAVABLOGS_HOT_ENTRIES_PATTERN = Pattern.compile(".*javablogs.com/ViewHotBlogEntries.*"); |
| 84 | |
|
| 85 | |
|
| 86 | |
|
| 87 | |
|
| 88 | |
|
| 89 | |
|
| 90 | |
public Referer(String url) { |
| 91 | 240 | super(url); |
| 92 | 240 | } |
| 93 | |
|
| 94 | |
protected void setUrl(String url) { |
| 95 | 240 | super.setUrl(url); |
| 96 | |
|
| 97 | 240 | if (url == null || url.length() == 0) { |
| 98 | 20 | setName("None"); |
| 99 | 220 | } else if (url.length() > GOOGLE_PREFIX.length() && |
| 100 | |
url.substring(0, GOOGLE_PREFIX.length()).equalsIgnoreCase(GOOGLE_PREFIX)) { |
| 101 | |
|
| 102 | 40 | String query = extractQuery(GOOGLE_QUERY_STRING_PATTERN, url); |
| 103 | 40 | setName("Google : " + query); |
| 104 | 40 | } else if (url.length() > GOOGLE_IMAGES_PREFIX.length() && |
| 105 | |
url.substring(0, GOOGLE_IMAGES_PREFIX.length()).equalsIgnoreCase(GOOGLE_IMAGES_PREFIX)) { |
| 106 | |
|
| 107 | 8 | String query = extractQuery(GOOGLE_IMAGES_QUERY_STRING_PATTERN, url); |
| 108 | 8 | query = extractQuery(GOOGLE_QUERY_STRING_PATTERN, query); |
| 109 | 8 | setName("Google Images : " + query); |
| 110 | 8 | } else if (url.length() > YAHOO_PREFIX.length() && |
| 111 | |
url.substring(0, YAHOO_PREFIX.length()).equalsIgnoreCase(YAHOO_PREFIX)) { |
| 112 | |
|
| 113 | 28 | String query = extractQuery(YAHOO_QUERY_STRING_PATTERN, url); |
| 114 | 28 | setName("Yahoo! : " + query); |
| 115 | 28 | } else if (url.length() > MSN_PREFIX.length() && |
| 116 | |
url.substring(0, MSN_PREFIX.length()).equalsIgnoreCase(MSN_PREFIX)) { |
| 117 | |
|
| 118 | 0 | String query = extractQuery(MSN_QUERY_STRING_PATTERN, url); |
| 119 | 0 | setName("MSN : " + query); |
| 120 | 0 | } else if (url.length() > MSN_BETA_PREFIX.length() && |
| 121 | |
url.substring(0, MSN_BETA_PREFIX.length()).equalsIgnoreCase(MSN_BETA_PREFIX)) { |
| 122 | |
|
| 123 | 0 | String query = extractQuery(MSN_QUERY_STRING_PATTERN, url); |
| 124 | 0 | setName("MSN beta : " + query); |
| 125 | 0 | } else if (url.length() >= BING_PREFIX.length() && |
| 126 | |
url.substring(0, BING_PREFIX.length()).equalsIgnoreCase(BING_PREFIX)) { |
| 127 | |
|
| 128 | 24 | String query = extractQuery(BING_QUERY_STRING_PATTERN, url); |
| 129 | 24 | setName("Bing : " + query); |
| 130 | 24 | } else if (JAVABLOGS_WELCOME_PATTERN.matcher(url).matches()) { |
| 131 | 16 | setName("java.blogs : Welcome"); |
| 132 | 104 | } else if (JAVABLOGS_HOT_ENTRIES_PATTERN.matcher(url).matches()) { |
| 133 | 4 | setName("java.blogs : Hot Entries"); |
| 134 | |
} else { |
| 135 | 100 | setName(url); |
| 136 | |
} |
| 137 | 240 | } |
| 138 | |
|
| 139 | |
private String extractQuery(Pattern pattern, String url) { |
| 140 | 108 | Matcher m = pattern.matcher(url); |
| 141 | 108 | String query = ""; |
| 142 | 108 | if (m.find()) { |
| 143 | 68 | int start = m.start(); |
| 144 | 68 | int end = m.end(); |
| 145 | 68 | query = url.substring(start+3, end); |
| 146 | 68 | if (query.endsWith("&")) { |
| 147 | 36 | query = query.substring(0, query.length()-1); |
| 148 | |
} |
| 149 | |
try { |
| 150 | 68 | query = URLDecoder.decode(query, "UTF-8"); |
| 151 | 4 | } catch (Exception e) { |
| 152 | 64 | } |
| 153 | |
} |
| 154 | |
|
| 155 | 108 | return query; |
| 156 | |
} |
| 157 | |
|
| 158 | |
|
| 159 | |
|
| 160 | |
|
| 161 | |
|
| 162 | |
|
| 163 | |
public String getDomainFilter() { |
| 164 | |
|
| 165 | 8 | if (getUrl() == null) { |
| 166 | 0 | return null; |
| 167 | |
} |
| 168 | |
|
| 169 | 8 | int index = getUrl().indexOf("://"); |
| 170 | 8 | if (index == -1) { |
| 171 | 4 | return getUrl(); |
| 172 | |
} |
| 173 | |
|
| 174 | 4 | String domainName = getUrl().substring(index+3); |
| 175 | 4 | index = domainName.indexOf("/"); |
| 176 | |
|
| 177 | 4 | if (index > -1) { |
| 178 | 0 | domainName = domainName.substring(0, index); |
| 179 | |
} |
| 180 | |
|
| 181 | 4 | if (domainName.indexOf(":") > -1) { |
| 182 | |
|
| 183 | 0 | domainName = domainName.substring(0, domainName.indexOf(":")); |
| 184 | |
} |
| 185 | |
|
| 186 | 4 | return ".*" + domainName + ".*"; |
| 187 | |
} |
| 188 | |
|
| 189 | |
} |