doxy/link__check_8cpp_source.html

 //  link_check implementation  -----------------------------------------------//

 //  Copyright Beman Dawes 2002.
 //  Distributed under the Boost Software License, Version 1.0.
 //  (See accompanying file LICENSE_1_0.txt or copy at
 //  http://www.boost.org/LICENSE_1_0.txt)

 #include "link_check.hpp"
 #include <boost/regex.hpp>
 #include <boost/filesystem/operations.hpp>
 #include <boost/filesystem/exception.hpp>

 namespace fs = boost::filesystem;

 namespace
 {
 // Pattern used to pull link targets out of HTML text.
 // It matches a tag (text starting at '<' with no intervening '>') that
 // carries an HREF or SRC attribute whose value is enclosed in double quotes.
 // Sub-expression 1 captures the text between the quotes, i.e. the URL.
 // The icase flag makes the match case-insensitive, so "href" and "src"
 // are accepted as well.
 boost::regex url_regex (
     "<\\s*[^>]*\\s+(?:HREF|SRC)" // HREF or SRC
     "\\s*=\\s*\"([^\"]*)\"",
     boost::regbase::normal | boost::regbase::icase);

 } // unnamed namespace

 namespace boost
 {
 namespace inspect
 {

 //  link_check constructor  --------------------------------------------------//

 link_check::link_check()
     : m_broken_errors ( 0 ),     // links whose target is not present
       m_unlinked_errors ( 0 ),   // HTML files nothing links to
       m_invalid_errors ( 0 ),    // malformed or disallowed URLs
       m_bookmark_errors ( 0 )    // URLs with a malformed bookmark part
 {
     // nothing else to set up: every error counter starts at zero
 }

 //  inspect (all)  -----------------------------------------------------------//

 void link_check::inspect (
     const string& library_name,
     const path& full_path )
 {
     // Directories are not recorded; only non-directory paths are tracked.
     if ( fs::is_directory ( full_path ) )
     {
         return;
     }

     // Remember that this path exists, keyed by its location relative to
     // the initial path, so later link checks can avoid touching the disk.
     // operator[] creates the entry on first use; the flag is OR-ed in so
     // that any bits already set for this path are preserved.
     m_paths[ relative_to ( full_path, fs::initial_path() ) ] |= m_present;
 }

 //  inspect ( .htm, .html )  -------------------------------------------------//

 void link_check::inspect (
     const string& library_name,
     const path& full_path,    // example: c:/foo/boost/filesystem/path.hpp
     const string& contents )      // contents of file to be inspected
 {
     string::const_iterator start ( contents.begin() );
     string::const_iterator end ( contents.end() );
     boost::match_results< string::const_iterator > what;
     boost::match_flag_type flags = boost::match_default;

     while ( boost::regex_search ( start, end, what, url_regex, flags) )
     {
         // what[0] contains the whole string iterators.
         // what[1] contains the URL iterators.
         do_url ( string ( what[1].first, what[1].second ),
                  library_name, full_path );

         start = what[0].second; // update search position
         flags |= boost::match_prev_avail; // update flags
         flags |= boost::match_not_bob;
     }
 }

 //  do_url  ------------------------------------------------------------------//

 void link_check::do_url ( const string& url, const string& library_name,
                           const path& source_path )  // precondition: source_path.is_complete()
 {
     if ( url[0] == '#'
             || url.find ( "mailto:" ) == 0
             || url.find ( "http:" ) == 0
             || url.find ( "https:" ) == 0
             || url.find ( "ftp:" ) == 0
             || url.find ( "news:" ) == 0
             || url.find ( "javascript:" ) == 0
        )
     {
         return;
     }

     if ( url.find ( "file:" ) == 0 )
     {
         ++m_invalid_errors;
         error ( library_name, source_path, "invalid URL (hardwired file): " + url );
         return;
     }

     // detect characters banned by RFC2396:
     if ( url.find_first_of ( " <>\"{}|\\^[]'" ) != string::npos )
     {
         ++m_invalid_errors;
         error ( library_name, source_path, "invalid character in URL: " + url );
     }

     // strip url of bookmarks
     string plain_url ( url );
     string::size_type pos ( plain_url.find ( '#' ) );
     if ( pos != string::npos )
     {
         plain_url.erase ( pos );
         // detect characters banned by RFC2396 in bookmark:
         if ( url.find ( '#', pos + 1 ) != string::npos )
         {
             ++m_bookmark_errors;
             error ( library_name, source_path, "invalid bookmark: " + url );
         }
     }

     // strip url of references to current dir
     if ( plain_url[0] == '.' && plain_url[1] == '/' )
     {
         plain_url.erase ( 0, 2 );
     }

     // url is relative source_path.branch()
     // convert to target_path, which is_complete()
     path target_path;
     try
     {
         target_path = source_path.branch_path() /= path ( plain_url, fs::no_check );
     }
     catch ( const fs::filesystem_error& )
     {
         ++m_invalid_errors;
         error ( library_name, source_path, "invalid URL: " + url );
         return;
     }

     // create a m_paths entry if necessary
     std::pair< const string, int > entry (
         relative_to ( target_path, fs::initial_path() ), 0 );
     m_path_map::iterator itr ( m_paths.find ( entry.first ) );
     if ( itr == m_paths.end() )
     {
         if ( fs::exists ( target_path ) )
         {
             entry.second = m_present;
         }
         itr = m_paths.insert ( entry ).first;
     }

     // itr now points to the m_paths entry
     itr->second |= m_linked_to;

     // if target isn't present, the link is broken
     if ( (itr->second & m_present) == 0 )
     {
         ++m_broken_errors;
         error ( library_name, source_path, "broken link: " + url );
     }
 }

 //  close  -------------------------------------------------------------------//

 void link_check::close()
 {
     for ( m_path_map::const_iterator itr = m_paths.begin();
             itr != m_paths.end(); ++itr )
     {
         // std::clog << itr->first << " " << itr->second << "\n";
         if ( (itr->second & m_linked_to) != m_linked_to
                 && (itr->first.rfind ( ".html" ) == itr->first.size() - 5
                     || itr->first.rfind ( ".htm" ) == itr->first.size() - 4)
                 // because they may be redirectors, it is OK if these are unlinked:
                 && itr->first.rfind ( "index.html" ) == string::npos
                 && itr->first.rfind ( "index.htm" ) == string::npos )
         {
             ++m_unlinked_errors;
             path full_path ( fs::initial_path() / path (itr->first, fs::no_check) );
             error ( impute_library ( full_path ), full_path, "unlinked file" );
         }
     }
 }

 } // namespace inspect
 } // namespace boost
anonymous_namespace{link_check.cpp}::url_regex
boost::regex url_regex("<\\s*[^>]*\\s+(?:HREF|SRC)" "\\s*=\\s*\"([^\"]*)\"", boost::regbase::normal|boost::regbase::icase)

boost
Definition: copyright_check.cpp:10

boost::inspect::link_check::inspect
virtual void inspect(const std::string &library_name, const path &full_path)

boost::inspect::link_check::m_broken_errors
long m_broken_errors
Definition: link_check.hpp:26

LifeV::MeshIO::anonymous_namespace{ParserGmsh.hpp}::elm_nodes_num
static const LifeV::UInt elm_nodes_num[]
Definition: ParserGmsh.hpp:57

boost::inspect::link_check::inspect
virtual void inspect(const std::string &library_name, const path &full_path, const std::string &contents)

boost::inspect::link_check::link_check
link_check()
Definition: link_check.cpp:31

boost::inspect
Definition: copyright_check.cpp:12

boost::inspect::link_check::do_url
void do_url(const string &url, const string &library_name, const path &full_source_path)
Definition: link_check.cpp:77

boost::inspect::link_check::close
virtual void close()
Definition: link_check.cpp:166

boost::inspect::link_check::m_bookmark_errors
long m_bookmark_errors
Definition: link_check.hpp:29

boost::inspect::link_check::m_unlinked_errors
long m_unlinked_errors
Definition: link_check.hpp:27

boost::inspect::link_check
Definition: link_check.hpp:24

boost::inspect::link_check::m_invalid_errors
long m_invalid_errors
Definition: link_check.hpp:28