HTML-ExtractMain

 view release on metacpan or  search on metacpan

t/test_case_data/google_blogger.html  view on Meta::CPAN

<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html dir='ltr' xmlns='http://www.w3.org/1999/xhtml' xmlns:b='http://www.google.com/2005/gml/b' xmlns:data='http://www.google.com/2005/gml/data' xmlns:expr='http://www.google.com/2005/gml/expr'>
<head>
<script type="text/javascript">(function() { var a=window;function c(b){this.t={};this.tick=function(d,i,e){e=e?e:(new Date).getTime();this.t[d]=[e,i]};this.tick("start",null,b)}var f=new c;a.jstiming={Timer:c,load:f};try{var g=null;if(a.chrome&&a.ch...
<!-- Document metadata: content type, generator, icon, canonical URL and feed/service endpoints. -->
<meta http-equiv="Content-Type" content="text/html; charset=UTF-8" />
<meta name="MSSmartTagsPreventParsing" content="true" />
<meta name="generator" content="blogger" />
<link rel="icon" type="image/vnd.microsoft.icon" href="http://www.blogger.com/favicon.ico" />
<link rel="canonical" href="http://googlegeodevelopers.blogspot.com/2008/05/introducing-our-geo-developers-blog.html" />
<link rel="alternate" type="application/atom+xml" title="Google Geo Developers Blog - Atom" href="http://googlegeodevelopers.blogspot.com/feeds/posts/default" />
<link rel="alternate" type="application/rss+xml" title="Google Geo Developers Blog - RSS" href="http://googlegeodevelopers.blogspot.com/feeds/posts/default?alt=rss" />
<link rel="service.post" type="application/atom+xml" title="Google Geo Developers Blog - Atom" href="http://www.blogger.com/feeds/3124040365160254795/posts/default" />
<link rel="EditURI" type="application/rsd+xml" title="RSD" href="http://www.blogger.com/rsd.g?blogID=3124040365160254795" />
<link rel="alternate" type="application/atom+xml" title="Google Geo Developers Blog - Atom" href="http://googlegeodevelopers.blogspot.com/feeds/1412170371094410255/comments/default" />
<!--[if IE]> <script> (function() { var html5 = ("abbr,article,aside,audio,canvas,datalist,details," + "figure,footer,header,hgroup,mark,menu,meter,nav,output," + "progress,section,time,video").split(','); for (var i = 0; i < html5.length; i++) { doc...
<title>Google Geo Developers Blog: Introducing our Geo Developers Blog</title>
<!-- Stylesheet links. The ampersand in the last href's query string is written as a character reference so the attribute value stays well-formed under the XHTML doctype. -->
<link href='http://www.google.com/uds/css/gsearch.css' rel='stylesheet' type='text/css'/>
<link href='http://www.google.com/uds/css/gsearch_darkgrey.css' rel='stylesheet' type='text/css'/>
<link href='http://www.google.com/css/gooey.css' rel='stylesheet' type='text/css'/>
<link href='http://www.google.com/googleblogs/css/template_styles.css' rel='stylesheet' type='text/css'/>
<link type='text/css' rel='stylesheet' href='http://www.blogger.com/static/v1/widgets/1892504587-widget_css_bundle.css' />
<link rel="stylesheet" type="text/css" href="http://www.blogger.com/dyn-css/authorization.css?targetBlogID=3124040365160254795&amp;zx=5391ce60-84d6-4c23-b73f-e9bef1480989"/>
<style type="text/css">
/* Show the element with id navbar-iframe as a block-level box. */
#navbar-iframe {
  display: block;
}
</style>

<style id='page-skin-1' type='text/css'><!--
/* Rules for descendants of #recent_posts: spans are grey (#666) at .85em with no top padding or margin; paragraphs are 1.1em with a .5em bottom margin. */
/* NOTE(review): the comment opened on the line just before the closing marker is never terminated inside this style element; confirm whether rules were elided from this view. */

#recent_posts span {color: #666; font-size:.85em; padding-top:0; margin-top:0;}
#recent_posts p{margin-bottom:.5em; font-size:1.1em;}
/*
--></style>
<!-- Loads uds.js (v=1.0) from the google.com/uds API endpoint. Query-string ampersands are written as character references so the src value is well-formed under the XHTML doctype; the resolved URL is unchanged. -->
<script src='http://www.google.com/uds/api?file=uds.js&amp;v=1.0&amp;key=ABQIAAAA_YJR13Pfd1DLDQs4kgKbQxTxAb0xtwQQCqJhhTH0tdrRSrWJ4RR2PabXite0o1TcEPO2djBsg9GdFg' type='text/javascript'></script>
<script language='Javascript' type='text/javascript'>
var blogURL='http://googlegeodevelopers.blogspot.com/2008/05/introducing-our-geo-developers-blog.html';
 //<![CDATA[
	 var coreSearch;


    function SolutionLoad() {
     var controlRoot = document.getElementById("searchControl");

    // create the search control
    coreSearch = new GSearchControl();
    coreSearch.setLinkTarget(GSearch.LINK_TARGET_SELF);
    coreSearch.setResultSetSize(GSearch.LARGE_RESULTSET);

    // prep for decoupled search form
    var searchFormElement = document.getElementById("searchform");
    var drawOptions = new GdrawOptions();
    drawOptions.setSearchFormRoot(searchFormElement);
    drawOptions.setDrawMode(GSearchControl.DRAW_MODE_TABBED);
  
    // populate - web, this blog, all blogs
    searcher = new GblogSearch();
    searcher.setSiteRestriction('http://googlegeodevelopers.blogspot.com');
    searcher.setUserDefinedLabel("This Blog");
    coreSearch.addSearcher(searcher);
 
    var searcher = new GwebSearch();
    searcher.setUserDefinedLabel("The Web");
    coreSearch.addSearcher(searcher);



( run in 0.361 second using v1.01-cache-2.11-cpan-b50b6a40fd4 )