]> git.argeo.org Git - lgpl/argeo-commons.git/blob - org.argeo.cms/src/org/argeo/cms/internal/kernel/NodeHttp.java
0510b3c837116053f1ac5c8265e5c2213b96885d
[lgpl/argeo-commons.git] / org.argeo.cms / src / org / argeo / cms / internal / kernel / NodeHttp.java
1 package org.argeo.cms.internal.kernel;
2
3 import static javax.jcr.Property.JCR_DESCRIPTION;
4 import static javax.jcr.Property.JCR_LAST_MODIFIED;
5 import static javax.jcr.Property.JCR_TITLE;
6 import static org.argeo.cms.CmsTypes.CMS_IMAGE;
7
8 import java.io.IOException;
9 import java.io.PrintWriter;
10 import java.security.PrivilegedExceptionAction;
11 import java.security.cert.X509Certificate;
12 import java.util.Calendar;
13 import java.util.Collection;
14 import java.util.Enumeration;
15
16 import javax.jcr.Node;
17 import javax.jcr.NodeIterator;
18 import javax.jcr.Repository;
19 import javax.jcr.RepositoryException;
20 import javax.jcr.Session;
21 import javax.security.auth.Subject;
22 import javax.servlet.FilterChain;
23 import javax.servlet.ServletException;
24 import javax.servlet.http.HttpServlet;
25 import javax.servlet.http.HttpServletRequest;
26 import javax.servlet.http.HttpServletResponse;
27 import javax.servlet.http.HttpSession;
28
29 import org.apache.commons.logging.Log;
30 import org.apache.commons.logging.LogFactory;
31 import org.argeo.cms.CmsException;
32 import org.argeo.jcr.JcrUtils;
33 import org.argeo.node.NodeConstants;
34 import org.osgi.framework.BundleContext;
35 import org.osgi.framework.ServiceReference;
36 import org.osgi.service.http.HttpService;
37
38 /**
39 * Intercepts and enriches http access, mainly focusing on security and
40 * transactionality.
41 */
42 class NodeHttp implements KernelConstants {
43 private final static Log log = LogFactory.getLog(NodeHttp.class);
44
45 // Filters
46 // private final RootFilter rootFilter;
47
48 // private final DoSFilter dosFilter;
49 // private final QoSFilter qosFilter;
50
51 private BundleContext bc;
52
53 NodeHttp(HttpService httpService, BundleContext bc) {
54 this.bc = bc;
55 // rootFilter = new RootFilter();
56 // dosFilter = new CustomDosFilter();
57 // qosFilter = new QoSFilter();
58
59 try {
60 httpService.registerServlet("/!", new LinkServlet(), null, null);
61 httpService.registerServlet("/robots.txt", new RobotServlet(), null, null);
62 } catch (Exception e) {
63 throw new CmsException("Cannot register filters", e);
64 }
65 }
66
67 public void destroy() {
68 }
69
70 class LinkServlet extends HttpServlet {
71 private static final long serialVersionUID = 3749990143146845708L;
72
73 @Override
74 protected void service(HttpServletRequest request, HttpServletResponse response)
75 throws ServletException, IOException {
76 String path = request.getPathInfo();
77 String userAgent = request.getHeader("User-Agent").toLowerCase();
78 boolean isBot = false;
79 boolean isCompatibleBrowser = false;
80 if (userAgent.contains("bot") || userAgent.contains("facebook") || userAgent.contains("twitter")) {
81 isBot = true;
82 } else if (userAgent.contains("webkit") || userAgent.contains("gecko") || userAgent.contains("firefox")
83 || userAgent.contains("msie") || userAgent.contains("chrome") || userAgent.contains("chromium")
84 || userAgent.contains("opera") || userAgent.contains("browser")) {
85 isCompatibleBrowser = true;
86 }
87
88 if (isBot) {
89 log.warn("# BOT " + request.getHeader("User-Agent"));
90 canonicalAnswer(request, response, path);
91 return;
92 }
93
94 if (isCompatibleBrowser && log.isTraceEnabled())
95 log.trace("# BWS " + request.getHeader("User-Agent"));
96 redirectTo(response, "/#" + path);
97 }
98
99 private void redirectTo(HttpServletResponse response, String location) {
100 response.setHeader("Location", location);
101 response.setStatus(HttpServletResponse.SC_FOUND);
102 }
103
104 // private boolean canonicalAnswerNeededBy(HttpServletRequest request) {
105 // String userAgent = request.getHeader("User-Agent").toLowerCase();
106 // return userAgent.startsWith("facebookexternalhit/");
107 // }
108
109 /** For bots which don't understand RWT. */
110 private void canonicalAnswer(HttpServletRequest request, HttpServletResponse response, String path) {
111 Session session = null;
112 try {
113 PrintWriter writer = response.getWriter();
114 session = Subject.doAs(KernelUtils.anonymousLogin(), new PrivilegedExceptionAction<Session>() {
115
116 @Override
117 public Session run() throws Exception {
118 Collection<ServiceReference<Repository>> srs = bc.getServiceReferences(Repository.class, "("
119 + NodeConstants.JCR_REPOSITORY_ALIAS + "=" + NodeConstants.ALIAS_NODE + ")");
120 Repository repository = bc.getService(srs.iterator().next());
121 return repository.login();
122 }
123
124 });
125 Node node = session.getNode(path);
126 String title = node.hasProperty(JCR_TITLE) ? node.getProperty(JCR_TITLE).getString() : node.getName();
127 String desc = node.hasProperty(JCR_DESCRIPTION) ? node.getProperty(JCR_DESCRIPTION).getString() : null;
128 Calendar lastUpdate = node.hasProperty(JCR_LAST_MODIFIED)
129 ? node.getProperty(JCR_LAST_MODIFIED).getDate() : null;
130 String url = KernelUtils.getCanonicalUrl(node, request);
131 String imgUrl = null;
132 loop: for (NodeIterator it = node.getNodes(); it.hasNext();) {
133 // Takes the first found cms:image
134 Node child = it.nextNode();
135 if (child.isNodeType(CMS_IMAGE)) {
136 imgUrl = KernelUtils.getDataUrl(child, request);
137 break loop;
138 }
139 }
140 StringBuilder buf = new StringBuilder();
141 buf.append("<html>");
142 buf.append("<head>");
143 writeMeta(buf, "og:title", escapeHTML(title));
144 writeMeta(buf, "og:type", "website");
145 buf.append("<meta name='twitter:card' content='summary' />");
146 buf.append("<meta name='twitter:site' content='@argeo_org' />");
147 writeMeta(buf, "og:url", url);
148 if (desc != null)
149 writeMeta(buf, "og:description", escapeHTML(desc));
150 if (imgUrl != null)
151 writeMeta(buf, "og:image", imgUrl);
152 if (lastUpdate != null)
153 writeMeta(buf, "og:updated_time", Long.toString(lastUpdate.getTime().getTime()));
154 buf.append("</head>");
155 buf.append("<body>");
156 buf.append(
157 "<p><b>!! This page is meant for indexing robots, not for real people," + " visit <a href='/#")
158 .append(path).append("'>").append(escapeHTML(title)).append("</a> instead.</b></p>");
159 writeCanonical(buf, node);
160 buf.append("</body>");
161 buf.append("</html>");
162 writer.print(buf.toString());
163
164 response.setHeader("Content-Type", "text/html");
165 writer.flush();
166 } catch (Exception e) {
167 throw new CmsException("Cannot write canonical answer", e);
168 } finally {
169 JcrUtils.logoutQuietly(session);
170 }
171 }
172
173 /**
174 * From
175 * http://stackoverflow.com/questions/1265282/recommended-method-for-
176 * escaping-html-in-java (+ escaping '). TODO Use
177 * org.apache.commons.lang.StringEscapeUtils
178 */
179 private String escapeHTML(String s) {
180 StringBuilder out = new StringBuilder(Math.max(16, s.length()));
181 for (int i = 0; i < s.length(); i++) {
182 char c = s.charAt(i);
183 if (c > 127 || c == '\'' || c == '"' || c == '<' || c == '>' || c == '&') {
184 out.append("&#");
185 out.append((int) c);
186 out.append(';');
187 } else {
188 out.append(c);
189 }
190 }
191 return out.toString();
192 }
193
194 private void writeMeta(StringBuilder buf, String tag, String value) {
195 buf.append("<meta property='").append(tag).append("' content='").append(value).append("'/>");
196 }
197
198 private void writeCanonical(StringBuilder buf, Node node) throws RepositoryException {
199 buf.append("<div>");
200 if (node.hasProperty(JCR_TITLE))
201 buf.append("<p>").append(node.getProperty(JCR_TITLE).getString()).append("</p>");
202 if (node.hasProperty(JCR_DESCRIPTION))
203 buf.append("<p>").append(node.getProperty(JCR_DESCRIPTION).getString()).append("</p>");
204 NodeIterator children = node.getNodes();
205 while (children.hasNext()) {
206 writeCanonical(buf, children.nextNode());
207 }
208 buf.append("</div>");
209 }
210 }
211
212 class RobotServlet extends HttpServlet {
213 private static final long serialVersionUID = 7935661175336419089L;
214
215 @Override
216 protected void service(HttpServletRequest request, HttpServletResponse response)
217 throws ServletException, IOException {
218 PrintWriter writer = response.getWriter();
219 writer.append("User-agent: *\n");
220 writer.append("Disallow:\n");
221 response.setHeader("Content-Type", "text/plain");
222 writer.flush();
223 }
224
225 }
226
227 /** Intercepts all requests. Authenticates. */
228 class RootFilter extends HttpFilter {
229
230 @Override
231 public void doFilter(HttpSession httpSession, HttpServletRequest request, HttpServletResponse response,
232 FilterChain filterChain) throws IOException, ServletException {
233 if (log.isTraceEnabled()) {
234 log.trace(request.getRequestURL()
235 .append(request.getQueryString() != null ? "?" + request.getQueryString() : ""));
236 logRequest(request);
237 }
238
239 String servletPath = request.getServletPath();
240
241 // client certificate
242 X509Certificate clientCert = extractCertificate(request);
243 if (clientCert != null) {
244 // TODO authenticate
245 // if (log.isDebugEnabled())
246 // log.debug(clientCert.getSubjectX500Principal().getName());
247 }
248
249 // skip data
250 if (servletPath.startsWith(PATH_DATA)) {
251 filterChain.doFilter(request, response);
252 return;
253 }
254
255 // skip /ui (workbench) for the time being
256 if (servletPath.startsWith(PATH_WORKBENCH)) {
257 filterChain.doFilter(request, response);
258 return;
259 }
260
261 // redirect long RWT paths to anchor
262 String path = request.getRequestURI().substring(servletPath.length());
263 int pathLength = path.length();
264 if (pathLength != 0 && (path.charAt(0) == '/') && !servletPath.endsWith("rwt-resources")
265 && !path.startsWith(KernelConstants.PATH_WORKBENCH) && path.lastIndexOf('/') != 0) {
266 String newLocation = request.getServletPath() + "#" + path;
267 response.setHeader("Location", newLocation);
268 response.setStatus(HttpServletResponse.SC_FOUND);
269 return;
270 }
271
272 // process normally
273 filterChain.doFilter(request, response);
274 }
275 }
276
277 private void logRequest(HttpServletRequest request) {
278 log.debug("contextPath=" + request.getContextPath());
279 log.debug("servletPath=" + request.getServletPath());
280 log.debug("requestURI=" + request.getRequestURI());
281 log.debug("queryString=" + request.getQueryString());
282 StringBuilder buf = new StringBuilder();
283 // headers
284 Enumeration<String> en = request.getHeaderNames();
285 while (en.hasMoreElements()) {
286 String header = en.nextElement();
287 Enumeration<String> values = request.getHeaders(header);
288 while (values.hasMoreElements())
289 buf.append(" " + header + ": " + values.nextElement());
290 buf.append('\n');
291 }
292
293 // attributed
294 Enumeration<String> an = request.getAttributeNames();
295 while (an.hasMoreElements()) {
296 String attr = an.nextElement();
297 Object value = request.getAttribute(attr);
298 buf.append(" " + attr + ": " + value);
299 buf.append('\n');
300 }
301 log.debug("\n" + buf);
302 }
303
304 private X509Certificate extractCertificate(HttpServletRequest req) {
305 X509Certificate[] certs = (X509Certificate[]) req.getAttribute("javax.servlet.request.X509Certificate");
306 if (null != certs && certs.length > 0) {
307 return certs[0];
308 }
309 return null;
310 }
311
312 // class CustomDosFilter extends DoSFilter {
313 // @Override
314 // protected String extractUserId(ServletRequest request) {
315 // HttpSession httpSession = ((HttpServletRequest) request)
316 // .getSession();
317 // if (isSessionAuthenticated(httpSession)) {
318 // String userId = ((SecurityContext) httpSession
319 // .getAttribute(SPRING_SECURITY_CONTEXT_KEY))
320 // .getAuthentication().getName();
321 // return userId;
322 // }
323 // return super.extractUserId(request);
324 //
325 // }
326 // }
327 }