<?xml version="1.0" encoding="UTF-8"?>
<blog-post>
  <author-id type="integer">68581</author-id>
  <blog-comments-count type="integer">1</blog-comments-count>
  <blog-post-status-id type="integer">3</blog-post-status-id>
  <body-format>econsultancy_xml</body-format>
  <body-formatted>
  &lt;p&gt;
    &lt;a href="http://googlewebmastercentral.blogspot.com/2008/04/crawling-through-html-forms.html"&gt;According to Google&lt;/a&gt;, the Googlebot is able to follow web forms using both text box inputs and drop-down or select boxes. &lt;/p&gt;
  &lt;p&gt;For select menus and radio buttons Google will choose values from the HTML and submit the form (it only does this with GET forms) to see if the results are something that might be helpful to searchers.&lt;/p&gt;
  &lt;p&gt;This strategy is quite straightforward and will help Google index a lot of the &lt;em&gt;"invisible"&lt;/em&gt; web that exists behind these forms.&lt;/p&gt;
  &lt;p&gt;The interesting part of the new system is when Google fills in a search box on a site using a made-up query. &lt;/p&gt;
  &lt;p&gt;Googlebot is able to generate queries that&#160;it thinks might be relevant to their users (or queries where they don't have many results at present) and enter these queries into a search box to try and find more results.&lt;/p&gt;
  &lt;p&gt;Essentially Google is automatically generating queries and performing those queries on internal search engines on millions of websites to see what&#160;it can find.&lt;/p&gt;
  &lt;p&gt;Webmasters are already spotting this and some are concerned about the content being indexed as well as increased server load.&lt;/p&gt;
</body-formatted>
  <body-unformatted>&lt;FormattedContent xmlns="http://www.e-consultancy.com/schema/formattedContent/"&gt;
  &lt;Paragraph&gt;
    &lt;Link URL="http://googlewebmastercentral.blogspot.com/2008/04/crawling-through-html-forms.html" Window="Self"&gt;According to Google&lt;/Link&gt;, the Googlebot is able to follow web forms using both text box inputs and drop-down or select boxes. &lt;/Paragraph&gt;
  &lt;Paragraph&gt;For select menus and radio buttons Google will choose values from the HTML and submit the form (it only does this with GET forms) to see if the results are something that might be helpful to searchers.&lt;/Paragraph&gt;
  &lt;Paragraph&gt;This strategy is quite straightforward and will help Google index a lot of the &lt;Quote&gt;"invisible"&lt;/Quote&gt; web that exists behind these forms.&lt;/Paragraph&gt;
  &lt;Paragraph&gt;The interesting part of the new system is when Google fills in a search box on a site using a made-up query. &lt;/Paragraph&gt;
  &lt;Paragraph&gt;Googlebot is able to generate queries that&#160;it thinks might be relevant to their users (or queries where they don't have many results at present) and enter these queries into a search box to try and find more results.&lt;/Paragraph&gt;
  &lt;Paragraph&gt;Essentially Google is automatically generating queries and performing those queries on internal search engines on millions of websites to see what&#160;it can find.&lt;/Paragraph&gt;
  &lt;Paragraph&gt;Webmasters are already spotting this and some are concerned about the content being indexed as well as increased server load.&lt;/Paragraph&gt;
&lt;/FormattedContent&gt;</body-unformatted>
  <created-at type="datetime">2008-04-14T11:53:00+01:00</created-at>
  <enabled-blog-comments-count type="integer">0</enabled-blog-comments-count>
  <expertise-level-id type="integer">1</expertise-level-id>
  <extract-format>econsultancy_xml</extract-format>
  <extract-formatted>
  &lt;p&gt;
    &lt;strong&gt;Last year Google was &lt;/strong&gt;
    &lt;a href="http://searchengineland.com/070312-104201.php"&gt;
      &lt;strong&gt;warning&lt;/strong&gt;
    &lt;/a&gt;
    &lt;strong&gt;webmasters that search results were not welcome in their index. &lt;/strong&gt;
  &lt;/p&gt;
  &lt;p&gt;Last week&#160;it started generating&#160;its own search results from websites by filling in HTML forms. &lt;em&gt;What's going on?&lt;/em&gt;&lt;/p&gt;
</extract-formatted>
  <extract-unformatted>&lt;FormattedContent xmlns="http://www.e-consultancy.com/schema/formattedContent/"&gt;
  &lt;Paragraph&gt;
    &lt;Emphasis&gt;Last year Google was &lt;/Emphasis&gt;
    &lt;Link URL="http://searchengineland.com/070312-104201.php" Window="Self"&gt;
      &lt;Emphasis&gt;warning&lt;/Emphasis&gt;
    &lt;/Link&gt;
    &lt;Emphasis&gt;webmasters that search results were not welcome in their index. &lt;/Emphasis&gt;
  &lt;/Paragraph&gt;
  &lt;Paragraph&gt;Last week&#160;it started generating&#160;its own search results from websites by filling in HTML forms. &lt;Quote&gt;What's going on?&lt;/Quote&gt;&lt;/Paragraph&gt;
&lt;/FormattedContent&gt;</extract-unformatted>
  <featured type="boolean">false</featured>
  <id type="integer">2364</id>
  <learn-more-formatted nil="true"></learn-more-formatted>
  <learn-more-unformatted nil="true"></learn-more-unformatted>
  <legacy-article-id type="integer">365438</legacy-article-id>
  <name>Google wants to index your invisible content</name>
  <private type="boolean">false</private>
  <published-at type="datetime">2008-04-14T12:50:00+01:00</published-at>
  <slug>google-wants-to-index-your-invisible-content</slug>
  <tweetbacks-updated-at type="datetime">2009-04-28T23:08:28+01:00</tweetbacks-updated-at>
  <unpublished-at type="datetime" nil="true"></unpublished-at>
  <updated-at type="datetime">2009-04-28T23:08:28+01:00</updated-at>
  <views-count type="integer">427</views-count>
</blog-post>
