Alvis-Convert

 view release on metacpan or  search on metacpan

lib/Alvis/Document/Encoding.pm  view on Meta::CPAN

 55331=>1,  55332=>1,  55333=>1,  55334=>1,  55335=>1,  55336=>1,  55337=>1, 
 55338=>1,  55339=>1,  55340=>1,  55341=>1,  55342=>1,  55343=>1,  55344=>1, 
 55345=>1,  55346=>1,  55347=>1,  55348=>1,  55349=>1,  55350=>1,  55351=>1, 
 55352=>1,  55353=>1,  55354=>1,  55355=>1,  55356=>1,  55357=>1,  55358=>1, 
 55359=>1,  55360=>1,  55361=>1,  55362=>1,  55363=>1,  55364=>1,  55365=>1, 
 55366=>1,  55367=>1,  55368=>1,  55369=>1,  55370=>1,  55371=>1,  55372=>1, 
 55373=>1,  55374=>1,  55375=>1,  55376=>1,  55377=>1,  55378=>1,  55379=>1, 
 55380=>1,  55381=>1,  55382=>1,  55383=>1,  55384=>1,  55385=>1,  55386=>1, 
 55387=>1,  55388=>1,  55389=>1,  55390=>1,  55391=>1,  55392=>1,  55393=>1, 
 55394=>1,  55395=>1,  55396=>1,  55397=>1,  55398=>1,  55399=>1,  55400=>1, 
 55401=>1,  55402=>1,  55403=>1,  55404=>1,  55405=>1,  55406=>1,  55407=>1, 
 55408=>1,  55409=>1,  55410=>1,  55411=>1,  55412=>1,  55413=>1,  55414=>1, 
 55415=>1,  55416=>1,  55417=>1,  55418=>1,  55419=>1,  55420=>1,  55421=>1, 
 55422=>1,  55423=>1,  55424=>1,  55425=>1,  55426=>1,  55427=>1,  55428=>1, 
 55429=>1,  55430=>1,  55431=>1,  55432=>1,  55433=>1,  55434=>1,  55435=>1, 
 55436=>1,  55437=>1,  55438=>1,  55439=>1,  55440=>1,  55441=>1,  55442=>1, 
 55443=>1,  55444=>1,  55445=>1,  55446=>1,  55447=>1,  55448=>1,  55449=>1, 
 55450=>1,  55451=>1,  55452=>1,  55453=>1,  55454=>1,  55455=>1,  55456=>1, 
 55457=>1,  55458=>1,  55459=>1,  55460=>1,  55461=>1,  55462=>1,  55463=>1, 
 55464=>1,  55465=>1,  55466=>1,  55467=>1,  55468=>1,  55469=>1,  55470=>1, 
 55471=>1,  55472=>1,  55473=>1,  55474=>1,  55475=>1,  55476=>1,  55477=>1, 

lib/Alvis/Document/Encoding.pm  view on Meta::CPAN

 56332=>1,  56333=>1,  56334=>1,  56335=>1,  56336=>1,  56337=>1,  56338=>1, 
 56339=>1,  56340=>1,  56341=>1,  56342=>1,  56343=>1,  56344=>1,  56345=>1, 
 56346=>1,  56347=>1,  56348=>1,  56349=>1,  56350=>1,  56351=>1,  56352=>1, 
 56353=>1,  56354=>1,  56355=>1,  56356=>1,  56357=>1,  56358=>1,  56359=>1, 
 56360=>1,  56361=>1,  56362=>1,  56363=>1,  56364=>1,  56365=>1,  56366=>1, 
 56367=>1,  56368=>1,  56369=>1,  56370=>1,  56371=>1,  56372=>1,  56373=>1, 
 56374=>1,  56375=>1,  56376=>1,  56377=>1,  56378=>1,  56379=>1,  56380=>1, 
 56381=>1,  56382=>1,  56383=>1,  56384=>1,  56385=>1,  56386=>1,  56387=>1, 
 56388=>1,  56389=>1,  56390=>1,  56391=>1,  56392=>1,  56393=>1,  56394=>1, 
 56395=>1,  56396=>1,  56397=>1,  56398=>1,  56399=>1,  56400=>1,  56401=>1, 
 56402=>1,  56403=>1,  56404=>1,  56405=>1,  56406=>1,  56407=>1,  56408=>1, 
 56409=>1,  56410=>1,  56411=>1,  56412=>1,  56413=>1,  56414=>1,  56415=>1, 
 56416=>1,  56417=>1,  56418=>1,  56419=>1,  56420=>1,  56421=>1,  56422=>1, 
 56423=>1,  56424=>1,  56425=>1,  56426=>1,  56427=>1,  56428=>1,  56429=>1, 
 56430=>1,  56431=>1,  56432=>1,  56433=>1,  56434=>1,  56435=>1,  56436=>1, 
 56437=>1,  56438=>1,  56439=>1,  56440=>1,  56441=>1,  56442=>1,  56443=>1, 
 56444=>1,  56445=>1,  56446=>1,  56447=>1,  56448=>1,  56449=>1,  56450=>1, 
 56451=>1,  56452=>1,  56453=>1,  56454=>1,  56455=>1,  56456=>1,  56457=>1, 
 56458=>1,  56459=>1,  56460=>1,  56461=>1,  56462=>1,  56463=>1,  56464=>1, 
 56465=>1,  56466=>1,  56467=>1,  56468=>1,  56469=>1,  56470=>1,  56471=>1, 
 56472=>1,  56473=>1,  56474=>1,  56475=>1,  56476=>1,  56477=>1,  56478=>1, 

t/test-data/to-split/29.xml  view on Meta::CPAN

      <semantic_unit><named_entity><form>Google</form><named_entity_type>soft</named_entity_type></named_entity></semantic_unit>
      <semantic_unit><named_entity><form>Google Search</form><named_entity_type>soft</named_entity_type></named_entity></semantic_unit>
      <semantic_unit><named_entity><form>Google Video</form><named_entity_type>soft</named_entity_type></named_entity></semantic_unit>
    </semantic_unit_level>
  </linguisticAnalysis>

  </documentRecord>
<documentRecord id="7F0D97BDACC9D73DA79364ADF93A9080" xmlns="http://alvis.info/enriched/">
    <acquisition>
      <acquisitionData>
        <modifiedDate>1144768340466</modifiedDate>
        <httpServer>Apache/1.3.28 (Unix) mod_gzip/1.3.26.1a PHP/4.3.10 mod_ssl/2.8.15 OpenSSL/0.9.7c</httpServer>
        <urls>
          <url>http://www.seroundtable.com/archives/003639.html</url>
        </urls>
      </acquisitionData>
      <canonicalDocument>        
        <section>There is a DigitalPoint Forum thread named that discusses a neat PageRank tool at http://www.webmastereyes.com/. The PageRank tool is different from others, in that it will enable you to plug in a URL and it will then place graphical...
      <metaData>
        <meta name="title">New Google PageRank Tool Plots PR Values Overlays On Page</meta>
        <meta name="dc:date">Tue, 11 Apr 2006 12:40:49 GMT</meta>



( run in 2.149 seconds using v1.01-cache-2.11-cpan-39bf76dae61 )