2 * Copyright 2001-2007 Internet2
\r
4 * Licensed under the Apache License, Version 2.0 (the "License");
\r
5 * you may not use this file except in compliance with the License.
\r
6 * You may obtain a copy of the License at
\r
8 * http://www.apache.org/licenses/LICENSE-2.0
\r
10 * Unless required by applicable law or agreed to in writing, software
\r
11 * distributed under the License is distributed on an "AS IS" BASIS,
\r
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
\r
13 * See the License for the specific language governing permissions and
\r
14 * limitations under the License.
\r
17 /** XMLRequestMapper.cpp
\r
19 * XML-based RequestMapper implementation
\r
22 #include "internal.h"
\r
23 #include "exceptions.h"
\r
24 #include "AccessControl.h"
\r
25 #include "RequestMapper.h"
\r
26 #include "SPRequest.h"
\r
27 #include "util/DOMPropertySet.h"
\r
28 #include "util/SPConstants.h"
\r
30 #include <xmltooling/util/NDC.h>
\r
31 #include <xmltooling/util/ReloadableXMLFile.h>
\r
32 #include <xmltooling/util/XMLHelper.h>
\r
33 #include <xercesc/util/XMLUniDefs.hpp>
\r
34 #include <xercesc/util/regx/RegularExpression.hpp>
\r
36 using namespace shibsp;
\r
37 using namespace xmltooling;
\r
38 using namespace std;
\r
42 // Blocks access when an ACL plugin fails to load.
// Override::loadACL() installs an instance of this class in place of the real
// provider when constructing that provider throws.
\r
43 class AccessControlDummy : public AccessControl
\r
// NOTE(review): the body of authorized() is not visible in this listing; going by
// the comment above it is expected to refuse access -- confirm against the full file.
52 bool authorized(const SPRequest& request, const Session* session) const {
\r
57 class Override : public DOMPropertySet, public DOMNodeFilter
// One node of the request-mapping tree. It is a property set whose typed
// getters (defined later in this file) delegate to the base Override when one
// is set, and it holds the child overrides keyed by name, by regular
// expression and by query parameter.
\r
// Default construction: no base override and no access control provider.
60 Override() : m_base(NULL), m_acl(NULL) {}
\r
// Builds the node from element e; `base` is the override to delegate to.
61 Override(const DOMElement* e, Category& log, const Override* base=NULL);
\r
// Typed property getters; each one re-declares the DOMPropertySet accessor of
// the same name so that m_base can be consulted as well.
65 pair<bool,bool> getBool(const char* name, const char* ns=NULL) const;
\r
66 pair<bool,const char*> getString(const char* name, const char* ns=NULL) const;
\r
67 pair<bool,const XMLCh*> getXMLString(const char* name, const char* ns=NULL) const;
\r
68 pair<bool,unsigned int> getUnsignedInt(const char* name, const char* ns=NULL) const;
\r
69 pair<bool,int> getInt(const char* name, const char* ns=NULL) const;
\r
// Unlike the scalar getters, ns defaults to the SP configuration namespace.
70 const PropertySet* getPropertySet(const char* name, const char* ns="urn:mace:shibboleth:2.0:native:sp:config") const;
\r
72 // Provides filter to exclude special config elements.
\r
73 short acceptNode(const DOMNode* node) const {
\r
// The only visible statement rejects every node handed to the filter.
74 return FILTER_REJECT;
\r
// Resolves the override that applies to the request, starting from this node.
77 const Override* locate(const SPRequest& request) const;
\r
// Returns this node's own provider if it has one, otherwise the nearest one
// found by walking up the m_base chain, otherwise NULL.
78 AccessControl* getAC() const { return (m_acl ? m_acl : (m_base ? m_base->getAC() : NULL)); }
\r
// Instantiates the access control provider configured under element e, if any.
81 void loadACL(const DOMElement* e, Category& log);
\r
// Child overrides keyed by name (the Path loop inserts lower-cased names).
83 map<string,Override*> m_map;
\r
// Child overrides selected by a regular expression, in configuration order.
84 vector< pair<RegularExpression*,Override*> > m_regexps;
\r
// Child overrides selected by query parameter: (parameter name, optional
// value expression) paired with the override; locate() treats a null
// expression as "presence of the parameter is enough".
85 vector< pair< pair<string,RegularExpression*>,Override*> > m_queries;
\r
// Override to delegate to; NULL when default-constructed or built without a base.
88 const Override* m_base;
\r
// Access control provider attached to this node, or NULL.
89 AccessControl* m_acl;
\r
92 class XMLRequestMapperImpl : public Override
// Root of the mapping tree for one loaded configuration. Adds host-level
// lookup (findOverride) on top of Override and can hold the DOM document.
\r
// Builds the host-level mappings from element e.
95 XMLRequestMapperImpl(const DOMElement* e, Category& log);
\r
97 ~XMLRequestMapperImpl() {
\r
// NOTE(review): the line before this one is missing from the listing; confirm
// the release is guarded, since m_document starts out NULL in the constructor.
99 m_document->release();
\r
// Hands a document to this object (XMLRequestMapper::load passes the one it
// held, or NULL). The body is not visible in this listing.
102 void setDocument(DOMDocument* doc) {
\r
// Picks the override for the given "scheme://host:port" key and request.
106 const Override* findOverride(const char* vhost, const SPRequest& request) const;
\r
// Secondary host keys. Per the constructor's own comment these exist so that
// an override reachable under two keys is not freed twice.
109 map<string,Override*> m_extras;
\r
// DOM document passed in through setDocument(); released in the destructor.
110 DOMDocument* m_document;
\r
113 #if defined (_MSC_VER)
\r
114 #pragma warning( push )
\r
115 #pragma warning( disable : 4250 )
\r
118 class XMLRequestMapper : public RequestMapper, public ReloadableXMLFile
// RequestMapper plugin backed by a reloadable XML file; the parsed
// configuration lives in m_impl.
\r
// Logs under the ".RequestMapper" sub-category of SHIBSP_LOGCAT and starts
// with no implementation object. The constructor body is not visible here.
121 XMLRequestMapper(const DOMElement* e) : ReloadableXMLFile(e,Category::getInstance(SHIBSP_LOGCAT".RequestMapper")), m_impl(NULL) {
\r
// NOTE(review): body not visible in this listing; presumably disposes of m_impl -- confirm.
125 ~XMLRequestMapper() {
\r
// Returns the settings (property set plus access control) for a request.
129 Settings getSettings(const SPRequest& request) const;
\r
// Loads the XML source and builds an XMLRequestMapperImpl from it.
132 pair<bool,DOMElement*> load();
\r
// Mapping tree built by load(); NULL until then.
135 XMLRequestMapperImpl* m_impl;
\r
138 #if defined (_MSC_VER)
\r
139 #pragma warning( pop )
\r
142 RequestMapper* SHIBSP_DLLLOCAL XMLRequestMapperFactory(const DOMElement* const & e)
// Plugin factory: returns a newly allocated XMLRequestMapper configured from
// element e. registerRequestMappers() registers it under both mapper types.
\r
144 return new XMLRequestMapper(e);
\r
147 static const XMLCh _AccessControl[] = UNICODE_LITERAL_13(A,c,c,e,s,s,C,o,n,t,r,o,l);
// XMLCh spellings of the element and attribute names this file looks up in
// the configuration DOM. The digit in each UNICODE_LITERAL_n macro is the
// number of characters in the name.
\r
148 static const XMLCh AccessControlProvider[] = UNICODE_LITERAL_21(A,c,c,e,s,s,C,o,n,t,r,o,l,P,r,o,v,i,d,e,r);
\r
149 static const XMLCh Host[] = UNICODE_LITERAL_4(H,o,s,t);
\r
150 static const XMLCh HostRegex[] = UNICODE_LITERAL_9(H,o,s,t,R,e,g,e,x);
\r
151 static const XMLCh htaccess[] = UNICODE_LITERAL_8(h,t,a,c,c,e,s,s);
\r
152 static const XMLCh ignoreCase[] = UNICODE_LITERAL_10(i,g,n,o,r,e,C,a,s,e);
\r
// Not a DOM name: this is the option string "i" handed to RegularExpression
// by the PathRegex and HostRegex loops.
153 static const XMLCh ignoreOption[] = UNICODE_LITERAL_1(i);
\r
154 static const XMLCh Path[] = UNICODE_LITERAL_4(P,a,t,h);
\r
155 static const XMLCh PathRegex[] = UNICODE_LITERAL_9(P,a,t,h,R,e,g,e,x);
\r
156 static const XMLCh Query[] = UNICODE_LITERAL_5(Q,u,e,r,y);
\r
157 static const XMLCh name[] = UNICODE_LITERAL_4(n,a,m,e);
\r
158 static const XMLCh regex[] = UNICODE_LITERAL_5(r,e,g,e,x);
\r
159 static const XMLCh _type[] = UNICODE_LITERAL_4(t,y,p,e);
\r
162 void SHIBSP_API shibsp::registerRequestMappers()
// Registers the request mapper factory with the SP configuration. Both the
// XML and the Native mapper type names map to the same factory function.
\r
164 SPConfig& conf=SPConfig::getConfig();
\r
165 conf.RequestMapperManager.registerFactory(XML_REQUEST_MAPPER, XMLRequestMapperFactory);
\r
166 conf.RequestMapperManager.registerFactory(NATIVE_REQUEST_MAPPER, XMLRequestMapperFactory);
\r
169 void Override::loadACL(const DOMElement* e, Category& log)
// Sets m_acl from the access control configuration found under element e.
// Three child element names are looked up, in this order: htaccess,
// AccessControl, AccessControlProvider. Any std::exception raised while a
// provider is being built is logged at critical level and m_acl is set to an
// AccessControlDummy instead of letting the exception escape.
// NOTE(review): the conditions that choose between the three lookups are not
// visible in this listing; presumably each lookup is tried only when the
// previous one found nothing -- confirm.
\r
172 const DOMElement* acl=XMLHelper::getFirstChildElement(e,htaccess);
\r
174 log.info("building Apache htaccess AccessControl provider...");
\r
175 m_acl=SPConfig::getConfig().AccessControlManager.newPlugin(HT_ACCESS_CONTROL,acl);
\r
178 acl=XMLHelper::getFirstChildElement(e,_AccessControl);
\r
180 log.info("building XML-based AccessControl provider...");
\r
181 m_acl=SPConfig::getConfig().AccessControlManager.newPlugin(XML_ACCESS_CONTROL,acl);
\r
184 acl=XMLHelper::getFirstChildElement(e,AccessControlProvider);
\r
// For the generic element the plugin type comes from its "type" attribute.
186 auto_ptr_char type(acl->getAttributeNS(NULL,_type));
\r
187 log.info("building AccessControl provider of type %s...",type.get());
\r
188 m_acl=SPConfig::getConfig().AccessControlManager.newPlugin(type.get(),acl);
\r
193 catch (exception& ex) {
\r
194 log.crit("exception building AccessControl provider: %s", ex.what());
\r
// Fall back to the dummy provider rather than leaving the node without one.
195 m_acl = new AccessControlDummy();
\r
199 Override::Override(const DOMElement* e, Category& log, const Override* base) : m_base(base), m_acl(NULL)
// Builds the override for element e and, as the visible loops show, one child
// Override (with this object as its base) for every nested Path, PathRegex
// and Query element. `log` receives warnings about skipped children; an
// invalid regular expression is logged and reported to the caller as a
// ConfigurationException.
// NOTE(review): many lines of this constructor (braces, conditions, and the
// statements under the two "Load ..." comments) are missing from this listing.
\r
202 // Load the property set.
\r
205 // Load any AccessControl provider.
\r
208 // Handle nested Paths.
\r
209 DOMElement* path = XMLHelper::getFirstChildElement(e,Path);
\r
// i is the 1-based position of the element; it is used in log messages only.
210 for (int i=1; path; ++i, path=XMLHelper::getNextSiblingElement(path,Path)) {
\r
211 const XMLCh* n=path->getAttributeNS(NULL,name);
\r
213 // Skip any leading slashes.
\r
214 while (n && *n==chForwardSlash)
\r
217 // Check for empty name.
\r
219 log.warn("skipping Path element (%d) with empty name attribute", i);
\r
223 // Check for an embedded slash.
\r
224 int slash=XMLString::indexOf(n,chForwardSlash);
\r
226 // Copy the first path segment.
\r
// NOTE(review): namebuf is allocated with new[]; the matching delete[] is not
// visible in this listing -- confirm it is released on every path.
227 XMLCh* namebuf=new XMLCh[slash + 1];
\r
228 for (int pos=0; pos < slash; pos++)
\r
229 namebuf[pos]=n[pos];
\r
230 namebuf[slash]=chNull;
\r
232 // Move past the slash in the original pathname.
\r
235 // Skip any leading slashes again.
\r
236 while (*n==chForwardSlash)
\r
240 // Create a placeholder Path element for the first path segment and replant under it.
\r
// This edits the configuration DOM in place: the new element takes the first
// segment as its name, the original element keeps the remainder and becomes
// the new element's child.
241 DOMElement* newpath=path->getOwnerDocument()->createElementNS(shibspconstants::SHIB2SPCONFIG_NS,Path);
\r
242 newpath->setAttributeNS(NULL,name,namebuf);
\r
243 path->setAttributeNS(NULL,name,n);
\r
244 path->getParentNode()->replaceChild(newpath,path);
\r
245 newpath->appendChild(path);
\r
247 // Repoint our locals at the new parent.
\r
249 n=path->getAttributeNS(NULL,name);
\r
252 // All we had was a pathname with trailing slash(es), so just reset it without them.
\r
253 path->setAttributeNS(NULL,name,namebuf);
\r
254 n=path->getAttributeNS(NULL,name);
\r
259 Override* o=new Override(path,log,this);
\r
260 pair<bool,const char*> name=o->getString("name");
\r
// The map key is a lower-cased copy of the name.
// NOTE(review): the release of dup (from strdup) is not visible in this
// listing -- confirm it is freed on both the duplicate and the success path.
261 char* dup=strdup(name.second);
\r
262 for (char* pch=dup; *pch; pch++)
\r
// NOTE(review): tolower() is given a plain char; a negative value other than
// EOF is undefined behaviour, so a cast to unsigned char would be safer.
263 *pch=tolower(*pch);
\r
264 if (m_map.count(dup)) {
\r
265 log.warn("skipping duplicate Path element (%s)",dup);
\r
271 log.debug("added Path mapping (%s)", dup);
\r
// PathRegex children are only examined when e itself is not a PathRegex.
275 if (!XMLString::equals(e->getLocalName(), PathRegex)) {
\r
276 // Handle nested PathRegexs.
\r
277 path = XMLHelper::getFirstChildElement(e,PathRegex);
\r
278 for (int i=1; path; ++i, path=XMLHelper::getNextSiblingElement(path,PathRegex)) {
\r
279 const XMLCh* n=path->getAttributeNS(NULL,regex);
\r
281 log.warn("skipping PathRegex element (%d) with empty regex attribute",i);
\r
285 auto_ptr<Override> o(new Override(path,log,this));
\r
287 const XMLCh* flag=path->getAttributeNS(NULL,ignoreCase);
\r
289 auto_ptr<RegularExpression> re(
\r
// An ignoreCase value whose first character is 'f' or '0' selects an empty
// option string; any other value selects the "i" option.
290 new RegularExpression(n, (flag && (*flag==chLatin_f || *flag==chDigit_0)) ? &chNull : ignoreOption)
\r
// Both objects leave their auto_ptrs here and are held by m_regexps from now on.
292 m_regexps.push_back(make_pair(re.release(), o.release()));
\r
294 catch (XMLException& ex) {
\r
295 auto_ptr_char tmp(ex.getMessage());
\r
296 log.error("caught exception while parsing PathRegex regular expression (%d): %s", i, tmp.get());
\r
297 throw ConfigurationException("Invalid regular expression in PathRegex element.");
\r
300 if (log.isDebugEnabled())
\r
301 log.debug("added <PathRegex> mapping (%s)", m_regexps.back().second->getString("regex").second);
\r
305 // Handle nested Querys.
\r
306 path = XMLHelper::getFirstChildElement(e,Query);
\r
307 for (int i=1; path; ++i, path=XMLHelper::getNextSiblingElement(path,Query)) {
\r
308 const XMLCh* n=path->getAttributeNS(NULL,name);
\r
310 log.warn("skipping Query element (%d) with empty name attribute",i);
\r
// ntemp is the parameter name converted for use as a std::string key.
313 auto_ptr_char ntemp(n);
\r
314 const XMLCh* v=path->getAttributeNS(NULL,regex);
\r
316 auto_ptr<Override> o(new Override(path,log,this));
\r
// NOTE(review): the condition guarding the allocation below is not visible;
// locate() handles a null expression, so presumably re stays NULL when the
// regex attribute is empty -- confirm.
318 RegularExpression* re = NULL;
\r
320 re = new RegularExpression(v);
\r
321 m_queries.push_back(make_pair(make_pair(ntemp.get(),re), o.release()));
\r
323 catch (XMLException& ex) {
\r
324 auto_ptr_char tmp(ex.getMessage());
\r
325 log.error("caught exception while parsing Query regular expression (%d): %s", i, tmp.get());
\r
326 throw ConfigurationException("Invalid regular expression in Query element.");
\r
329 log.debug("added <Query> mapping (%s)", ntemp.get());
\r
// On failure the children already stored in m_map are destroyed here.
// NOTE(review): the rest of this handler is not visible; confirm it also
// cleans up m_regexps, m_queries and m_acl and rethrows.
332 catch (exception&) {
\r
334 for_each(m_map.begin(),m_map.end(),xmltooling::cleanup_pair<string,Override>());
\r
339 Override::~Override()
// Destroys the child overrides held in m_map and walks m_regexps and
// m_queries to dispose of their contents.
// NOTE(review): only the deletion of the query expression is visible in this
// listing; the loop bodies that delete the remaining pointers, and whatever
// happens to m_acl, are missing -- confirm against the full file.
\r
342 for_each(m_map.begin(),m_map.end(),xmltooling::cleanup_pair<string,Override>());
\r
343 for (vector< pair<RegularExpression*,Override*> >::iterator i = m_regexps.begin(); i != m_regexps.end(); ++i) {
\r
347 for (vector< pair< pair<string,RegularExpression*>,Override*> >::iterator j = m_queries.begin(); j != m_queries.end(); ++j) {
\r
// Deleting a NULL expression (a presence-only query) is harmless.
348 delete j->first.second;
\r
353 pair<bool,bool> Override::getBool(const char* name, const char* ns) const
// Boolean property lookup that can fall back to the base override.
// The local DOMPropertySet is consulted first; the final statement returns
// the base's answer when a base exists and the local result otherwise.
// NOTE(review): the check that short-circuits on a local hit is not visible
// in this listing (presumably a test of ret.first) -- confirm.
\r
355 pair<bool,bool> ret=DOMPropertySet::getBool(name,ns);
\r
358 return m_base ? m_base->getBool(name,ns) : ret;
\r
361 pair<bool,const char*> Override::getString(const char* name, const char* ns) const
// String property lookup that can fall back to the base override.
// The local DOMPropertySet is consulted first; the final statement returns
// the base's answer when a base exists and the local result otherwise.
// NOTE(review): the check that short-circuits on a local hit is not visible
// in this listing (presumably a test of ret.first) -- confirm.
\r
363 pair<bool,const char*> ret=DOMPropertySet::getString(name,ns);
\r
366 return m_base ? m_base->getString(name,ns) : ret;
\r
369 pair<bool,const XMLCh*> Override::getXMLString(const char* name, const char* ns) const
// XMLCh string property lookup that can fall back to the base override.
// The local DOMPropertySet is consulted first; the final statement returns
// the base's answer when a base exists and the local result otherwise.
// NOTE(review): the check that short-circuits on a local hit is not visible
// in this listing (presumably a test of ret.first) -- confirm.
\r
371 pair<bool,const XMLCh*> ret=DOMPropertySet::getXMLString(name,ns);
\r
374 return m_base ? m_base->getXMLString(name,ns) : ret;
\r
377 pair<bool,unsigned int> Override::getUnsignedInt(const char* name, const char* ns) const
// Unsigned integer property lookup that can fall back to the base override.
// The local DOMPropertySet is consulted first; the final statement returns
// the base's answer when a base exists and the local result otherwise.
// NOTE(review): the check that short-circuits on a local hit is not visible
// in this listing (presumably a test of ret.first) -- confirm.
\r
379 pair<bool,unsigned int> ret=DOMPropertySet::getUnsignedInt(name,ns);
\r
382 return m_base ? m_base->getUnsignedInt(name,ns) : ret;
\r
385 pair<bool,int> Override::getInt(const char* name, const char* ns) const
// Signed integer property lookup that can fall back to the base override.
// The local DOMPropertySet is consulted first; the final statement returns
// the base's answer when a base exists and the local result otherwise.
// NOTE(review): the check that short-circuits on a local hit is not visible
// in this listing (presumably a test of ret.first) -- confirm.
\r
387 pair<bool,int> ret=DOMPropertySet::getInt(name,ns);
\r
390 return m_base ? m_base->getInt(name,ns) : ret;
\r
393 const PropertySet* Override::getPropertySet(const char* name, const char* ns) const
// Nested property set lookup that can fall back to the base override.
\r
395 const PropertySet* ret=DOMPropertySet::getPropertySet(name,ns);
\r
// A local hit, or the absence of a base, ends the search at this node. The
// statement under this condition is not visible here (presumably it returns ret).
396 if (ret || !m_base)
\r
// Reached only with a non-null m_base and no local match.
398 return m_base->getPropertySet(name,ns);
\r
401 const Override* Override::locate(const SPRequest& request) const
// Finds the most specific override for the request, starting at this node.
// Three stages are visible: a segment-by-segment walk through m_map, a regex
// match on what is left of the path, and a loop over query parameter matches
// that repeats for as long as it descends a level.
// NOTE(review): a number of lines (declarations of pos and descended, the
// loop headers, the assignments to o, the final return) are missing from
// this listing, so the comments below describe only what is shown.
\r
403 // This function is confusing because it's *not* recursive.
\r
404 // The whole path is tokenized and mapped in a loop, so the
\r
405 // path parameter starts with the entire request path and
\r
406 // we can skip the leading slash as irrelevant.
\r
407 const char* path = request.getRequestURI();
\r
411 // Now we copy the path, chop the query string, and lower case it.
\r
// NOTE(review): dup is passed to strdup() unconditionally on the visible
// lines, and its release is not shown -- confirm a NULL request URI is
// handled above and that dup is freed after tokenizing.
412 char* dup=strdup(path);
\r
413 char* sep=strchr(dup,'?');
\r
416 for (char* pch=dup; *pch; pch++)
\r
// NOTE(review): tolower() is given a plain char; a negative value other than
// EOF is undefined behaviour, so a cast to unsigned char would be safer.
417 *pch=tolower(*pch);
\r
419 // Default is for the current object to provide settings.
\r
420 const Override* o=this;
\r
422 // Tokenize the path by segment and try and map each segment.
\r
// strtok_r is used where the build defines HAVE_STRTOK_R, strtok otherwise.
423 #ifdef HAVE_STRTOK_R
\r
425 const char* token=strtok_r(dup,"/",&pos);
\r
427 const char* token=strtok(dup,"/");
\r
// Lookup is against the lower-cased copy, in the map of the current node.
430 map<string,Override*>::const_iterator i=o->m_map.find(token);
\r
431 if (i==o->m_map.end())
\r
432 break; // Once there's no match, we've consumed as much of the path as possible here.
\r
433 // We found a match, so reset the settings pointer.
\r
436 // We descended a step down the path, so we need to advance the original
\r
437 // parameter for the regex step later.
\r
// path still points into the untouched request URI, not into dup.
438 path += strlen(token);
\r
442 // Get the next segment, if any.
\r
443 #ifdef HAVE_STRTOK_R
\r
444 token=strtok_r(NULL,"/",&pos);
\r
446 token=strtok(NULL,"/");
\r
452 // If there's anything left, we try for a regex match on the rest of the path minus the query string.
\r
454 string path2(path);
\r
// With no '?' present find() returns npos and substr keeps the whole string.
455 path2 = path2.substr(0,path2.find('?'));
\r
457 for (vector< pair<RegularExpression*,Override*> >::const_iterator re = o->m_regexps.begin(); re != o->m_regexps.end(); ++re) {
\r
458 if (re->first->matches(path2.c_str())) {
\r
465 // Finally, check for query string matches. This is another "unrolled" recursive descent in a loop.
\r
// The scan over the current node's queries stops as soon as descended is set.
469 for (vector< pair< pair<string,RegularExpression*>,Override*> >::const_iterator q = o->m_queries.begin(); !descended && q != o->m_queries.end(); ++q) {
\r
470 vector<const char*> vals;
\r
471 if (request.getParameters(q->first.first.c_str(), vals)) {
\r
// A non-null expression means a value must match; NULL means presence only.
472 if (q->first.second) {
\r
473 // We have to match one of the values.
\r
474 for (vector<const char*>::const_iterator v = vals.begin(); v != vals.end(); ++v) {
\r
475 if (q->first.second->matches(*v)) {
\r
483 // The simple presence of the parameter is sufficient to match.
\r
// Repeat the query scan from the newly selected node after each descent.
489 } while (descended);
\r
494 XMLRequestMapperImpl::XMLRequestMapperImpl(const DOMElement* e, Category& log) : m_document(NULL)
// Builds the host level of the mapping tree from element e: one Override per
// HostRegex child (stored in m_regexps) and one per Host child, the latter
// registered under one or more "scheme://name[:port]" keys. Duplicate keys
// are reported through `log` as warnings.
// NOTE(review): many lines (braces, `continue` statements, the map
// insertions, the statements under the two "Load ..." comments) are missing
// from this listing; comments below describe only what is shown.
\r
497 xmltooling::NDC ndc("XMLRequestMapperImpl");
\r
500 // Load the property set.
\r
503 // Load any AccessControl provider.
\r
506 // Loop over the HostRegex elements.
\r
507 const DOMElement* host = XMLHelper::getFirstChildElement(e,HostRegex);
\r
// i is the 1-based position of the element; it is used in log messages only.
508 for (int i=1; host; ++i, host=XMLHelper::getNextSiblingElement(host,HostRegex)) {
\r
509 const XMLCh* n=host->getAttributeNS(NULL,regex);
\r
511 log.warn("Skipping HostRegex element (%d) with empty regex attribute",i);
\r
515 auto_ptr<Override> o(new Override(host,log,this));
\r
517 const XMLCh* flag=host->getAttributeNS(NULL,ignoreCase);
\r
519 auto_ptr<RegularExpression> re(
\r
// An ignoreCase value whose first character is 'f' or '0' selects an empty
// option string; any other value selects the "i" option.
520 new RegularExpression(n, (flag && (*flag==chLatin_f || *flag==chDigit_0)) ? &chNull : ignoreOption)
\r
// Both objects leave their auto_ptrs here and are held by m_regexps from now on.
522 m_regexps.push_back(make_pair(re.release(), o.release()));
\r
524 catch (XMLException& ex) {
\r
525 auto_ptr_char tmp(ex.getMessage());
\r
// NOTE(review): unlike the PathRegex handler, no throw is visible after this
// log call -- confirm whether an invalid HostRegex is meant to be fatal.
526 log.error("caught exception while parsing HostRegex regular expression (%d): %s", i, tmp.get());
\r
529 log.debug("Added <HostRegex> mapping for %s", m_regexps.back().second->getString("regex").second);
\r
532 // Loop over the Host elements.
\r
533 host = XMLHelper::getFirstChildElement(e,Host);
\r
534 for (int i=1; host; ++i, host=XMLHelper::getNextSiblingElement(host,Host)) {
\r
535 const XMLCh* n=host->getAttributeNS(NULL,name);
\r
537 log.warn("Skipping Host element (%d) with empty name attribute",i);
\r
541 Override* o=new Override(host,log,this);
\r
542 pair<bool,const char*> name=o->getString("name");
\r
543 pair<bool,const char*> scheme=o->getString("scheme");
\r
544 pair<bool,const char*> port=o->getString("port");
\r
// Host names are keyed by a lower-cased copy.
546 char* dup=strdup(name.second);
\r
547 for (char* pch=dup; *pch; pch++)
\r
// NOTE(review): tolower() is given a plain char; a negative value other than
// EOF is undefined behaviour, so a cast to unsigned char would be safer.
548 *pch=tolower(*pch);
\r
// NOTE(review): dup comes from strdup() (malloc family) but auto_ptr releases
// its pointer with delete, which is a mismatched deallocation; free() is the
// matching call.
549 auto_ptr<char> dupwrap(dup);
\r
551 if (!scheme.first && port.first) {
\r
552 // No scheme, but a port, so assume http.
\r
553 scheme = pair<bool,const char*>(true,"http");
\r
555 else if (scheme.first && !port.first) {
\r
556 // Scheme, no port, so default it.
\r
557 // XXX Use getservbyname instead?
\r
// Well-known default ports for the schemes recognised here. A scheme outside
// this list leaves port.second as it was.
559 if (!strcmp(scheme.second,"http"))
\r
560 port.second = "80";
\r
561 else if (!strcmp(scheme.second,"https"))
\r
562 port.second = "443";
\r
563 else if (!strcmp(scheme.second,"ftp"))
\r
564 port.second = "21";
\r
565 else if (!strcmp(scheme.second,"ldap"))
\r
566 port.second = "389";
\r
567 else if (!strcmp(scheme.second,"ldaps"))
\r
568 port.second = "636";
\r
571 if (scheme.first) {
\r
572 string url(scheme.second);
\r
573 url=url + "://" + dup;
\r
575 // Is this the default port?
\r
576 if ((!strcmp(scheme.second,"http") && !strcmp(port.second,"80")) ||
\r
577 (!strcmp(scheme.second,"https") && !strcmp(port.second,"443")) ||
\r
578 (!strcmp(scheme.second,"ftp") && !strcmp(port.second,"21")) ||
\r
579 (!strcmp(scheme.second,"ldap") && !strcmp(port.second,"389")) ||
\r
580 (!strcmp(scheme.second,"ldaps") && !strcmp(port.second,"636"))) {
\r
581 // First store a port-less version.
\r
// A key counts as a duplicate if either map already contains it.
582 if (m_map.count(url) || m_extras.count(url)) {
\r
583 log.warn("Skipping duplicate Host element (%s)",url.c_str());
\r
588 log.debug("Added <Host> mapping for %s",url.c_str());
\r
590 // Now append the port. We use the extras map, to avoid double freeing the object later.
\r
591 url=url + ':' + port.second;
\r
593 log.debug("Added <Host> mapping for %s",url.c_str());
\r
// Non-default port: only the key that includes the port is registered.
596 url=url + ':' + port.second;
\r
597 if (m_map.count(url) || m_extras.count(url)) {
\r
598 log.warn("Skipping duplicate Host element (%s)",url.c_str());
\r
603 log.debug("Added <Host> mapping for %s",url.c_str());
\r
607 // No scheme or port, so we enter dual hosts on http:80 and https:443
\r
608 string url("http://");
\r
610 if (m_map.count(url) || m_extras.count(url)) {
\r
611 log.warn("Skipping duplicate Host element (%s)",url.c_str());
\r
616 log.debug("Added <Host> mapping for %s",url.c_str());
\r
619 if (m_map.count(url) || m_extras.count(url)) {
\r
620 log.warn("Skipping duplicate Host element (%s)",url.c_str());
\r
624 log.debug("Added <Host> mapping for %s",url.c_str());
\r
628 if (m_map.count(url) || m_extras.count(url)) {
\r
629 log.warn("Skipping duplicate Host element (%s)",url.c_str());
\r
633 log.debug("Added <Host> mapping for %s",url.c_str());
\r
635 url = url + ":443";
\r
636 if (m_map.count(url) || m_extras.count(url)) {
\r
637 log.warn("Skipping duplicate Host element (%s)",url.c_str());
\r
641 log.debug("Added <Host> mapping for %s",url.c_str());
\r
646 const Override* XMLRequestMapperImpl::findOverride(const char* vhost, const SPRequest& request) const
// Selects the host-level override for vhost (getSettings passes a
// "scheme://host:port" string) and lets it resolve the request further.
// Lookup order on the visible lines: m_map, then m_extras, then the host
// regular expressions. When nothing matches, this object itself is returned.
// NOTE(review): the statements that assign o after each successful lookup
// are missing from this listing.
\r
648 const Override* o=NULL;
\r
649 map<string,Override*>::const_iterator i=m_map.find(vhost);
\r
650 if (i!=m_map.end())
\r
653 i=m_extras.find(vhost);
\r
654 if (i!=m_extras.end())
\r
// The !o condition ends the scan once an override has been selected.
657 for (vector< pair<RegularExpression*,Override*> >::const_iterator re = m_regexps.begin(); !o && re != m_regexps.end(); ++re) {
\r
658 if (re->first->matches(vhost))
\r
664 return o ? o->locate(request) : this;
\r
667 pair<bool,DOMElement*> XMLRequestMapper::load()
// Loads the configuration through ReloadableXMLFile::load() and builds a new
// XMLRequestMapperImpl from the resulting root element. The visible return
// statement yields (false, NULL).
// NOTE(review): the lines between setDocument() and the return are missing
// from this listing; presumably they replace m_impl with impl -- confirm.
\r
669 // Load from source using base class.
\r
670 pair<bool,DOMElement*> raw = ReloadableXMLFile::load();
\r
672 // If we own it, wrap it.
\r
// raw.first decides whether the janitor holds the owner document or NULL, so
// the document is cleaned up if building the impl throws.
673 XercesJanitor<DOMDocument> docjanitor(raw.first ? raw.second->getOwnerDocument() : NULL);
\r
675 XMLRequestMapperImpl* impl = new XMLRequestMapperImpl(raw.second,m_log);
\r
677 // If we held the document, transfer it to the impl. If we didn't, it's a no-op.
\r
678 impl->setDocument(docjanitor.release());
\r
683 return make_pair(false,(DOMElement*)NULL);
\r
686 RequestMapper::Settings XMLRequestMapper::getSettings(const SPRequest& request) const
// Resolves the settings for a request: the matching override serves as the
// property set and its getAC() result as the access control provider.
\r
// Lookup key has the form "scheme://hostname:port"; the port is always included.
688 ostringstream vhost;
\r
689 vhost << request.getScheme() << "://" << request.getHostname() << ':' << request.getPort();
\r
691 const Override* o=m_impl->findOverride(vhost.str().c_str(), request);
\r
// The applicationId lookup below is done for the debug message only.
693 if (m_log.isDebugEnabled()) {
\r
695 xmltooling::NDC ndc("getSettings");
\r
697 pair<bool,const char*> ret=o->getString("applicationId");
\r
// NOTE(review): ret.second is handed to %s without testing ret.first --
// confirm applicationId always resolves to a non-null string here.
698 m_log.debug("mapped %s%s to %s", vhost.str().c_str(), request.getRequestURI() ? request.getRequestURI() : "", ret.second);
\r
701 return Settings(o,o->getAC());
\r