<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<title>SEM WATCH 搜索引擎营销观察 &#187; Baiduspider</title>
	<atom:link href="http://semwatch.org/tag/baiduspider/feed/" rel="self" type="application/rss+xml" />
	<link>http://semwatch.org</link>
	<description>SEMWATCH.org version Beta</description>
	<lastBuildDate>Tue, 17 Apr 2012 01:48:36 +0000</lastBuildDate>
	<language>zh-CN</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.org/?v=3.0.5</generator>
		<item>
		<title>百度蜘蛛也走后门</title>
		<link>http://semwatch.org/2009/10/baidu-spider-back-door/</link>
		<comments>http://semwatch.org/2009/10/baidu-spider-back-door/#comments</comments>
		<pubDate>Thu, 15 Oct 2009 04:44:48 +0000</pubDate>
		<dc:creator>mutu</dc:creator>
				<category><![CDATA[搜索产业观察]]></category>
		<category><![CDATA[Baiduspider]]></category>
		<category><![CDATA[百度]]></category>

		<guid isPermaLink="false">http://semwatch.org/?p=1166</guid>
		<description><![CDATA[在百度普通的抓取蜘蛛（ Baiduspider ）之外，百度还放养着两类变异的蜘蛛，这两类变异蜘蛛一类称为 cpro，另一类叫做 sfkr，专爬百度的“关系户”。<table class="wumii-related-items" cellspacing="0" cellpadding="3" border="0"  style="clear: both;">
    
    <tr>
        <td colspan="4"><b><font size="-1"  style="display: block !important; padding: 20px 0 5px !important;">您可能也喜欢：</font></b></td>
    </tr>
    
        <tr>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important;">
                    <a target="_blank" title="探一探百度凤巢的巢穴" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2009%2F12%2Fbaidu-switched-fengchao%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F10%2Fbaidu-spider-back-door%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12021508.png" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">探一探百度凤巢的巢穴</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="百度搜索结果首页调整" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2009%2F06%2Fbaidu-updates-serp%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F10%2Fbaidu-spider-back-door%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/14/12158410.png" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">百度搜索结果首页调整</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="老外眼里的百度" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2009%2F07%2F%25E8%2580%2581%25E5%25A4%2596%25E7%259C%25BC%25E9%2587%258C%25E7%259A%2584%25E7%2599%25BE%25E5%25BA%25A6%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F10%2Fbaidu-spider-back-door%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12021527.jpg" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">老外眼里的百度</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="乱谈百度地域性影响因素" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2011%2F05%2Fbaidu-regional-factors%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F10%2Fbaidu-spider-back-door%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12014845.png" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">乱谈百度地域性影响因素</font>
                    </a>
                </td>
        </tr>
    
    <tr>
        <td colspan="4" align="right">
            <a style="text-decoration: none !important;" href="http://www.wumii.com/widget/relatedItems" target="_blank" title="无觅相关文章插件">
                <font size="-1" color="#bbbbbb" style="display: block !important; font-family: arial !important; padding: 5px 0 !important; font-size: 12px !important; color: #bbb !important;">无觅</font>
            </a>
        </td>
    </tr>
</table>]]></description>
			<content:encoded><![CDATA[<p>在百度普通的抓取蜘蛛（ <a title="百度蜘蛛" href="http://semwatch.org/tag/baiduspider" target="_blank">Baiduspider</a> ）之外，百度还放养着两类变异的蜘蛛，这两类变异蜘蛛一类称为 cpro，另一类叫做 sfkr，专爬百度的“关系户”。</p>
<p><span id="more-1166"></span></p>
<p>所谓关系户是指，给百度直接带来利益的网站，这种利益一是金钱（付费推广的客户）、二是内容资源（内容联盟伙伴）。对待这两类关系户，百度便培育了 cpro 与 sfkr 这两类专走后门的变异蜘蛛。</p>
<p>先来看看百度自己的<a href="http://www.baidu.com/search/spider.html">描述</a>吧！</p>
<p><img class="size-full wp-image-1167  alignright" style="border: 5px solid black;" title="search-spider" src="http://kejiban.com/wp-content/uploads/2009/10/search-spider.jpg" alt="专爬敏感地带的搜索引擎蜘蛛" width="368" height="228" /></p>
<p><em>Baiduspider-cpro：抓取百度联盟会员站点的网页以优化推广效果，只有您的网站加入百度联盟，才会被 cpro 抓取。</em></p>
<p><em>Baiduspider-sfkr：抓取参加百度竞价排名的网页以优化推广效果，只有您的网站参加了竞价排名或其他搜索营销服务，才会被 sfkr 抓取。</em></p>
<p><em>注意：Baiduspider-cpro 和 Baiduspider-sfkr 抓取的网页并不会建入索引，只是执行与客户约定的操作，所以不遵守robots协议。</em></p>
<p>我们该怎样理解百度的变异蜘蛛呢，是为百度系网站提供的福利？还是利益相关者的特殊照顾？其中的“注意”更搞笑，“抓取的网页并不会建入索引，只是执行与客户约定的操作……”这简直是此地无银，不建入索引，只执行操作，那不就等于是给其客户摆样子，随便糊弄一下嘛，瞧我的蜘蛛多勤快呀，仅此而已，那怎么能在客户的面前体现出优化了的推广效果呢？</p>
<p>不管如何，百度还真的称得上是有中国特色的搜索引擎呢，知道所谓的公平与公正都是瞎球扯，只要有商业利益，这个社会有个球的透明与公平。不公平也就罢了，这个世道就是这样，咱也能理解，不过起码还是需要有一些专业精神吧，既然做了就干脆做得赤裸裸一点，写到明处，让大家都知道交了钱或进入联盟能得到的具体照顾：蜘蛛勤快、<a href="http://semwatch.org/">自然搜索结果</a>里显示的机会增多。这样对利益共同体也有个好交代！不过，对外的时候就别再宣称自己多么多么对中小网站一视同仁了，这样真的是几头不讨好，还落了一个“老子是流氓你能拿老子怎么样”的恶嘴脸。</p>
<p>本文首发<a href="http://semwatch.org/"><span> SEM Watch</span></a>，转载请注明出处,欢迎大家留言或者来信（talk[at]SEMWatch.org） ，或者在 twitter 上 <a onclick="pageTracker._trackPageview('/outbound/article/twitter.com');" href="https://twitter.com/semwatch"><span>Follow SEMWATCH </span></a>。懒得翻墙推的，也可以来新浪<a onclick="pageTracker._trackPageview('/outbound/article/t.sina.com.cn');" href="http://t.sina.com.cn/semwatch"><span>围脖我们</span></a>拉。</p>
<table class="wumii-related-items" cellspacing="0" cellpadding="3" border="0"  style="clear: both;">
    
    <tr>
        <td colspan="4"><b><font size="-1"  style="display: block !important; padding: 20px 0 5px !important;">您可能也喜欢：</font></b></td>
    </tr>
    
        <tr>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important;">
                    <a target="_blank" title="探一探百度凤巢的巢穴" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2009%2F12%2Fbaidu-switched-fengchao%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F10%2Fbaidu-spider-back-door%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12021508.png" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">探一探百度凤巢的巢穴</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="百度搜索结果首页调整" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2009%2F06%2Fbaidu-updates-serp%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F10%2Fbaidu-spider-back-door%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/14/12158410.png" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">百度搜索结果首页调整</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="老外眼里的百度" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2009%2F07%2F%25E8%2580%2581%25E5%25A4%2596%25E7%259C%25BC%25E9%2587%258C%25E7%259A%2584%25E7%2599%25BE%25E5%25BA%25A6%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F10%2Fbaidu-spider-back-door%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12021527.jpg" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">老外眼里的百度</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="乱谈百度地域性影响因素" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2011%2F05%2Fbaidu-regional-factors%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F10%2Fbaidu-spider-back-door%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12014845.png" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">乱谈百度地域性影响因素</font>
                    </a>
                </td>
        </tr>
    
    <tr>
        <td colspan="4" align="right">
            <a style="text-decoration: none !important;" href="http://www.wumii.com/widget/relatedItems" target="_blank" title="无觅相关文章插件">
                <font size="-1" color="#bbbbbb" style="display: block !important; font-family: arial !important; padding: 5px 0 !important; font-size: 12px !important; color: #bbb !important;">无觅</font>
            </a>
        </td>
    </tr>
</table>]]></content:encoded>
			<wfw:commentRss>http://semwatch.org/2009/10/baidu-spider-back-door/feed/</wfw:commentRss>
		<slash:comments>6</slash:comments>
		</item>
		<item>
		<title>Google 每天都会抓取一次 Robots.txt</title>
		<link>http://semwatch.org/2009/09/google-snatch-at-robots-txt-everyday/</link>
		<comments>http://semwatch.org/2009/09/google-snatch-at-robots-txt-everyday/#comments</comments>
		<pubDate>Mon, 07 Sep 2009 12:02:26 +0000</pubDate>
		<dc:creator>Dengshaowei</dc:creator>
				<category><![CDATA[搜索产业观察]]></category>
		<category><![CDATA[Baiduspider]]></category>
		<category><![CDATA[Google]]></category>
		<category><![CDATA[Googlebot]]></category>
		<category><![CDATA[robots]]></category>
		<category><![CDATA[robots.txt]]></category>

		<guid isPermaLink="false">http://semwatch.org/?p=787</guid>
		<description><![CDATA[今天在 Google 帮助论坛上看到了一位 googler 说的关于 robots.txt 的事 Google 通常每天都会来扫描一下 robots.txt 这是印象中 Google员工第一次从官方层面进行表态说 蜘蛛通常每天会来访问robots.txt这个文件 打个比方就像每天吃饭一样，忽然一顿不吃或者一直没的吃 (饿死了？)，对蜘蛛来说感觉是很不好的。 robots.txt 文件对抓取网络的搜索引擎漫游器（称为漫游器）进行限制。这些漫游器是自动的，在它们访问网页前会查看是否存在限制其访问特定网页的 robots.txt 文件。如果你想保护网站上的某些内容不被搜索引擎收入的话，robots.txt是一个简单有效的工具。 这里举一个robots.txt的例子： User-agent: * Disallow: /cgi-bin/ Disallow: /tmp/ Disallow: /~name/ 其中 User-agent 我知道的有 Baiduspider、Googlebot、msnbot、Yahoo、Sogou、YodaoBot、Sosospider。相信这些名字，大家一看就知道了。 而最新的 Bing.com，据传用的也是 MSNbot，当然还会有一些分类，如 MSNBot-Media 负责图片，MSNBot-NewsBlogs 负责新闻和博客，MSNBot-Products 负责产品和购物车程序等等。 详细的写法，你可以参考一下 Google，依样画一下葫芦：http://www.google.com/robots.txt 本文首发搜索引擎营销观察，转载请注明。<table class="wumii-related-items" cellspacing="0" cellpadding="3" border="0"  style="clear: both;">
    
    <tr>
        <td colspan="4"><b><font size="-1"  style="display: block !important; padding: 20px 0 5px !important;">您可能也喜欢：</font></b></td>
    </tr>
    
        <tr>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important;">
                    <a target="_blank" title="模仿 Googlebot 机器人查看你网页的代码" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2009%2F10%2Fcheck-your-source-code-fetch-as-googlebot%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F09%2Fgoogle-snatch-at-robots-txt-everyday%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12020977.jpg" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">模仿 Googlebot 机器人查看你网页的代码</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="Google Panda 更新那点事" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2011%2F06%2Fgoogle-panda-update%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F09%2Fgoogle-snatch-at-robots-txt-everyday%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/29/15042703.png" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">Google Panda 更新那点事</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="用 site: 查 Google 收录靠谱吗？" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2009%2F11%2Fhow-inaccurate-google-site-operator-is-and-how-to-fix-it%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F09%2Fgoogle-snatch-at-robots-txt-everyday%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12088199.jpg" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">用 site: 查 Google 收录靠谱吗？</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="时代精神2010-Google之一年一回头" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2010%2F12%2F%25E6%2597%25B6%25E4%25BB%25A3%25E7%25B2%25BE%25E7%25A5%259E2010-google%25E4%25B9%258B%25E4%25B8%2580%25E5%25B9%25B4%25E4%25B8%2580%25E5%259B%259E%25E5%25A4%25B4-2%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F09%2Fgoogle-snatch-at-robots-txt-everyday%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12025866.gif" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">时代精神2010-Google之一年一回头</font>
                    </a>
                </td>
        </tr>
    
    <tr>
        <td colspan="4" align="right">
            <a style="text-decoration: none !important;" href="http://www.wumii.com/widget/relatedItems" target="_blank" title="无觅相关文章插件">
                <font size="-1" color="#bbbbbb" style="display: block !important; font-family: arial !important; padding: 5px 0 !important; font-size: 12px !important; color: #bbb !important;">无觅</font>
            </a>
        </td>
    </tr>
</table>]]></description>
			<content:encoded><![CDATA[<p>今天在<a href="http://www.google.com/support/forum/p/Webmasters/thread?tid=04fb6fef83409914&amp;hl=en"> Google 帮助论坛上看到了</a>一位 googler 说的关于 robots.txt 的事<span id="more-787"></span></p>
<blockquote><p>Google 通常每天都会来扫描一下 robots.txt</p></blockquote>
<p>这是印象中 Google员工<strong>第一次</strong>从<strong>官方层面</strong>进行表态说 蜘蛛通常<strong>每天会来访问robots.txt</strong>这个文件</p>
<p>打个比方就像每天吃饭一样，忽然一顿不吃或者一直没的吃 (饿死了？)，对蜘蛛来说感觉是很不好的。</p>
<p>robots.txt 文件对抓取网络的搜索引擎漫游器（称为漫游器）进行限制。这些漫游器是自动的，在它们访问网页前会查看是否存在限制其访问特定网页的  robots.txt 文件。如果你想保护网站上的某些内容不被搜索引擎收入的话，robots.txt是一个简单有效的工具。</p>
<p><span style="font-size: 100%;">这里举一个</span><span style="font-size: 100%;">robots.txt的例子：</span></p>
<blockquote>
<pre>User-agent: *
Disallow: /cgi-bin/
Disallow: /tmp/
Disallow: /~name/</pre>
</blockquote>
<p><span style="font-size: 100%;"><span style="background-color: #ffffff;">其中 User-agent 我知道的有 Baiduspider、Googlebot、msnbot、Yahoo、Sogou、YodaoBot、Sosospider。相信这些名字，大家一看就知道了。</span></span></p>
<p>而最新的 Bing.com，据传用的也是 MSNbot，当然还会有一些分类，如 MSNBot-Media 负责图片，MSNBot-NewsBlogs 负责新闻和博客，MSNBot-Products 负责产品和购物车程序等等。</p>
<p>详细的写法，你可以参考一下 Google，依样画一下葫芦：http://www.google.com/robots.txt</p>
<p>本文首发<a href="http://semwatch.org">搜索引擎营销</a>观察，转载请注明。</p>
<table class="wumii-related-items" cellspacing="0" cellpadding="3" border="0"  style="clear: both;">
    
    <tr>
        <td colspan="4"><b><font size="-1"  style="display: block !important; padding: 20px 0 5px !important;">您可能也喜欢：</font></b></td>
    </tr>
    
        <tr>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important;">
                    <a target="_blank" title="模仿 Googlebot 机器人查看你网页的代码" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2009%2F10%2Fcheck-your-source-code-fetch-as-googlebot%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F09%2Fgoogle-snatch-at-robots-txt-everyday%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12020977.jpg" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">模仿 Googlebot 机器人查看你网页的代码</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="Google Panda 更新那点事" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2011%2F06%2Fgoogle-panda-update%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F09%2Fgoogle-snatch-at-robots-txt-everyday%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/29/15042703.png" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">Google Panda 更新那点事</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="用 site: 查 Google 收录靠谱吗？" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2009%2F11%2Fhow-inaccurate-google-site-operator-is-and-how-to-fix-it%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F09%2Fgoogle-snatch-at-robots-txt-everyday%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12088199.jpg" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">用 site: 查 Google 收录靠谱吗？</font>
                    </a>
                </td>
                <td width="102" valign="top" style="padding: 5px !important; margin: 0 !important; border-left: 1px solid #DDDDDD !important;">
                    <a target="_blank" title="时代精神2010-Google之一年一回头" style="text-decoration: none !important; cursor: pointer !important;" href="http://app.wumii.com/ext/redirect?url=http%3A%2F%2Fsemwatch.org%2F2010%2F12%2F%25E6%2597%25B6%25E4%25BB%25A3%25E7%25B2%25BE%25E7%25A5%259E2010-google%25E4%25B9%258B%25E4%25B8%2580%25E5%25B9%25B4%25E4%25B8%2580%25E5%259B%259E%25E5%25A4%25B4-2%2F&from=http%3A%2F%2Fsemwatch.org%2F2009%2F09%2Fgoogle-snatch-at-robots-txt-everyday%2F">
                        <img style="margin: 0 !important; padding: 2px !important; border: 1px solid #DDDDDD !important; width: 96px !important; height: 96px !important;" src="http://static.wumii.com/site_images/2011/06/13/12025866.gif" width="96px" height="96px" /><br />
                        <font size="-1" color="#333333" style="display: block !important; line-height: 15px !important; width: 102px !important; font: 12px/15px arial !important; height: 60px !important; margin: 3px 0 0 0 !important; padding: 0 !important; overflow: hidden !important;">时代精神2010-Google之一年一回头</font>
                    </a>
                </td>
        </tr>
    
    <tr>
        <td colspan="4" align="right">
            <a style="text-decoration: none !important;" href="http://www.wumii.com/widget/relatedItems" target="_blank" title="无觅相关文章插件">
                <font size="-1" color="#bbbbbb" style="display: block !important; font-family: arial !important; padding: 5px 0 !important; font-size: 12px !important; color: #bbb !important;">无觅</font>
            </a>
        </td>
    </tr>
</table>]]></content:encoded>
			<wfw:commentRss>http://semwatch.org/2009/09/google-snatch-at-robots-txt-everyday/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
	</channel>
</rss>

