<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Geo-reference data in MS Word, PowerPoint, PDF in Esri Geoportal Server Questions</title>
    <link>https://community.esri.com/t5/esri-geoportal-server-questions/geo-reference-data-in-ms-word-powerpoint-pdf/m-p/478530#M604</link>
    <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;to do this, you will need to extend the harvesting framework and for example &lt;A href="http://tika.apache.org/" target="_blank"&gt;Apache Tika&lt;/A&gt;. A description of &lt;A href="https://github.com/Esri/geoportal-server/wiki/Extending-the-Web-Harvester" target="_blank"&gt;how to extend the metadata harvester&lt;/A&gt; is given on the Geoportal Server wiki. I have attached some code I have been working on to do exactly this. Using Tika, it reads the metadata from the documents (such as Office/PDF document properties) into a Dublin Core XML structure. My next step was to see if I could geolocate places based on accessing a gazetteer with place names. I'd be happy to collaborate on further developing this and adding it to Geoportal Server as a feature.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
    <pubDate>Mon, 28 Jul 2014 08:49:59 GMT</pubDate>
    <dc:creator>MartenHogeweg</dc:creator>
    <dc:date>2014-07-28T08:49:59Z</dc:date>
    <item>
      <title>Geo-reference data in MS Word, PowerPoint, PDF</title>
      <link>https://community.esri.com/t5/esri-geoportal-server-questions/geo-reference-data-in-ms-word-powerpoint-pdf/m-p/478529#M603</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;SPAN&gt;Good Afternoon,&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;STRONG&gt;Question&lt;/STRONG&gt;&lt;SPAN&gt;: Does Geoportal Server support the search and retrieval of Geo-referenced data embedded in MS Word, PowerPoint, and plain-text documents?&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN&gt;Appreciate your insight and suggestions.&lt;/SPAN&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Thu, 24 Apr 2014 17:08:17 GMT</pubDate>
      <guid>https://community.esri.com/t5/esri-geoportal-server-questions/geo-reference-data-in-ms-word-powerpoint-pdf/m-p/478529#M603</guid>
      <dc:creator>StephenCoppola</dc:creator>
      <dc:date>2014-04-24T17:08:17Z</dc:date>
    </item>
    <item>
      <title>Re: Geo-reference data in MS Word, PowerPoint, PDF</title>
      <link>https://community.esri.com/t5/esri-geoportal-server-questions/geo-reference-data-in-ms-word-powerpoint-pdf/m-p/478530#M604</link>
      <description>&lt;HTML&gt;&lt;HEAD&gt;&lt;/HEAD&gt;&lt;BODY&gt;&lt;P&gt;to do this, you will need to extend the harvesting framework and for example &lt;A href="http://tika.apache.org/" target="_blank"&gt;Apache Tika&lt;/A&gt;. A description of &lt;A href="https://github.com/Esri/geoportal-server/wiki/Extending-the-Web-Harvester" target="_blank"&gt;how to extend the metadata harvester&lt;/A&gt; is given on the Geoportal Server wiki. I have attached some code I have been working on to do exactly this. Using Tika, it reads the metadata from the documents (such as Office/PDF document properties) into a Dublin Core XML structure. My next step was to see if I could geolocate places based on accessing a gazetteer with place names. I'd be happy to collaborate on further developing this and adding it to Geoportal Server as a feature.&lt;/P&gt;&lt;/BODY&gt;&lt;/HTML&gt;</description>
      <pubDate>Mon, 28 Jul 2014 08:49:59 GMT</pubDate>
      <guid>https://community.esri.com/t5/esri-geoportal-server-questions/geo-reference-data-in-ms-word-powerpoint-pdf/m-p/478530#M604</guid>
      <dc:creator>MartenHogeweg</dc:creator>
      <dc:date>2014-07-28T08:49:59Z</dc:date>
    </item>
  </channel>
</rss>

