<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <!-- Channel-level metadata: feed title, home page, summary, language, and last build time. -->
    <title>Crawler Research Updates</title>
    <link>http://site4726837462198733423.s3-website-us-east-1.amazonaws.com/</link>
    <description>Updates on the web crawler behavior research project.</description>
    <language>en-us</language>
    <!-- RSS 2.0 dates must be RFC 822 date-times, not ISO 8601. -->
    <lastBuildDate>Thu, 19 Feb 2026 12:00:00 GMT</lastBuildDate>
    <!-- Atom self-link: tells consumers the URL this feed is served from. -->
    <atom:link href="http://site4726837462198733423.s3-website-us-east-1.amazonaws.com/feed.xml"
               rel="self"
               type="application/rss+xml"/>
    <!-- Entry: site launch announcement. pubDate is an RFC 822 date-time, as RSS 2.0 requires. -->
    <item>
      <title>Research Site Launched</title>
      <link>http://site4726837462198733423.s3-website-us-east-1.amazonaws.com/about.html</link>
      <description>The crawler behavior research site is now live with files of various types.</description>
      <pubDate>Thu, 19 Feb 2026 12:00:00 GMT</pubDate>
      <!-- guid is an opaque identifier, not a URL (isPermaLink="false"). -->
      <guid isPermaLink="false">research-2026-02-19</guid>
    </item>
    <!-- Entry: image format test files added. pubDate is an RFC 822 date-time, as RSS 2.0 requires. -->
    <item>
      <title>Image Format Tests Added</title>
      <link>http://site4726837462198733423.s3-website-us-east-1.amazonaws.com/about.html</link>
      <description>PNG, JPEG, GIF, SVG, and WebP images have been added to test crawler behavior with binary content.</description>
      <pubDate>Wed, 18 Feb 2026 12:00:00 GMT</pubDate>
      <!-- guid is an opaque identifier, not a URL (isPermaLink="false"). -->
      <guid isPermaLink="false">research-2026-02-18</guid>
    </item>
    <!-- Entry: access logging enabled. pubDate is an RFC 822 date-time, as RSS 2.0 requires. -->
    <item>
      <title>Access Logging Configured</title>
      <link>http://site4726837462198733423.s3-website-us-east-1.amazonaws.com/about.html</link>
      <description>S3 server access logging is now active, capturing timestamp, referrer, and user-agent for every request.</description>
      <pubDate>Tue, 17 Feb 2026 12:00:00 GMT</pubDate>
      <!-- guid is an opaque identifier, not a URL (isPermaLink="false"). -->
      <guid isPermaLink="false">research-2026-02-17</guid>
    </item>
    <!-- Entry: XML sitemap published. pubDate is an RFC 822 date-time, as RSS 2.0 requires. -->
    <item>
      <title>Sitemap Published</title>
      <link>http://site4726837462198733423.s3-website-us-east-1.amazonaws.com/about.html</link>
      <description>An XML sitemap has been published listing all files. Observing which crawlers discover and parse it.</description>
      <pubDate>Mon, 16 Feb 2026 12:00:00 GMT</pubDate>
      <!-- guid is an opaque identifier, not a URL (isPermaLink="false"). -->
      <guid isPermaLink="false">research-2026-02-16</guid>
    </item>
    <!-- Entry: JavaScript and CSS files added. pubDate is an RFC 822 date-time, as RSS 2.0 requires. -->
    <item>
      <title>JavaScript and CSS Added</title>
      <link>http://site4726837462198733423.s3-website-us-east-1.amazonaws.com/about.html</link>
      <description>Substantial JavaScript and CSS files added to test whether crawlers download and parse non-HTML resources.</description>
      <pubDate>Sun, 15 Feb 2026 12:00:00 GMT</pubDate>
      <!-- guid is an opaque identifier, not a URL (isPermaLink="false"). -->
      <guid isPermaLink="false">research-2026-02-15</guid>
    </item>
    <!-- Entry: robots.txt directives published. pubDate is an RFC 822 date-time, as RSS 2.0 requires. -->
    <item>
      <title>Robots.txt Directives Set</title>
      <link>http://site4726837462198733423.s3-website-us-east-1.amazonaws.com/about.html</link>
      <description>Custom robots.txt with per-crawler directives published. Monitoring compliance across different bots.</description>
      <pubDate>Sat, 14 Feb 2026 12:00:00 GMT</pubDate>
      <!-- guid is an opaque identifier, not a URL (isPermaLink="false"). -->
      <guid isPermaLink="false">research-2026-02-14</guid>
    </item>
    <!-- Entry: JSON and XML data files added. pubDate is an RFC 822 date-time, as RSS 2.0 requires. -->
    <item>
      <title>Data Files Published</title>
      <link>http://site4726837462198733423.s3-website-us-east-1.amazonaws.com/about.html</link>
      <description>JSON and XML data files added. Testing whether crawlers index structured data formats.</description>
      <pubDate>Fri, 13 Feb 2026 12:00:00 GMT</pubDate>
      <!-- guid is an opaque identifier, not a URL (isPermaLink="false"). -->
      <guid isPermaLink="false">research-2026-02-13</guid>
    </item>
    <!-- Entry: extensionless file test added. pubDate is an RFC 822 date-time, as RSS 2.0 requires. -->
    <item>
      <title>Extensionless File Test</title>
      <link>http://site4726837462198733423.s3-website-us-east-1.amazonaws.com/about.html</link>
      <description>A configuration file without extension has been added to test Content-Type handling by crawlers.</description>
      <pubDate>Thu, 12 Feb 2026 12:00:00 GMT</pubDate>
      <!-- guid is an opaque identifier, not a URL (isPermaLink="false"). -->
      <guid isPermaLink="false">research-2026-02-12</guid>
    </item>
  </channel>
</rss>