<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<title>Internet Business &#38; Marketing Strategy - Andy Beard &#187; duplicate content</title>
	<atom:link href="http://andybeard.eu/tag/duplicate-content/feed" rel="self" type="application/rss+xml" />
	<link>http://andybeard.eu</link>
	<description>Internet Marketing, Lead Acquisition, Online Business Strategy and Social Media with Original Opinion and Loads of Attitude</description>
	<lastBuildDate>Sun, 12 Feb 2012 06:16:17 +0000</lastBuildDate>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	
		<item>
		<title>How a Blogroll Can Still Kill Your PageRank</title>
		<link>http://andybeard.eu/121/how-a-blogroll-can-kill-your-pagerank.html</link>
		<comments>http://andybeard.eu/121/how-a-blogroll-can-kill-your-pagerank.html#comments</comments>
		<pubDate>Sun, 08 Aug 2010 10:00:42 +0000</pubDate>
		<dc:creator>Andy Beard</dc:creator>
				<category><![CDATA[blogging tips]]></category>
		<category><![CDATA[SEO Blog]]></category>
		<category><![CDATA[article marketing]]></category>
		<category><![CDATA[Article Submission]]></category>
		<category><![CDATA[articles]]></category>
		<category><![CDATA[backlinks]]></category>
		<category><![CDATA[Better Blogging]]></category>
		<category><![CDATA[blog]]></category>
		<category><![CDATA[Blog Navigation]]></category>
		<category><![CDATA[blogging]]></category>
		<category><![CDATA[Blogroll]]></category>
		<category><![CDATA[comments]]></category>
		<category><![CDATA[duplicate content]]></category>
		<category><![CDATA[Dynamic Linking]]></category>
		<category><![CDATA[folksonomy]]></category>
		<category><![CDATA[how to]]></category>
		<category><![CDATA[howto]]></category>
		<category><![CDATA[linking strategy]]></category>
		<category><![CDATA[mininet]]></category>
		<category><![CDATA[nofollow]]></category>
		<category><![CDATA[revenge of the mininet]]></category>
		<category><![CDATA[search engines]]></category>
		<category><![CDATA[Site Navigation]]></category>
		<category><![CDATA[ultimate tag warrior]]></category>
		<category><![CDATA[utw]]></category>
		<category><![CDATA[website traffic]]></category>

		<guid isPermaLink="false">http://andybeard.eu/2006/11/how-a-blogroll-can-kill-your-pagerank.html</guid>
		<description><![CDATA[
<p>Navigational elements on a blog or any website are an important feature, but you should be careful not to take things to extremes which can hurt the progress of your site, both from a SEO perspective and for website conversion.</p>
<p><a href="http://andybeard.eu/121/how-a-blogroll-can-kill-your-pagerank.html" class="more-link">Read more on How a Blogroll Can Still Kill Your PageRank&#8230;</a></p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F121%252Fhow-a-blogroll-can-kill-your-pagerank.html%22%2C%20%22shorturl%22%3A%20%22http%3A%2F%2Fbit.ly%2FajXhVi%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22How%20a%20Blogroll%20Can%20Still%20Kill%20Your%20PageRank%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/article-marketing" title="article marketing" rel="tag">article marketing</a>, <a href="http://andybeard.eu/tag/article-submission" title="Article Submission" rel="tag">Article Submission</a>, <a href="http://andybeard.eu/tag/articles" title="articles" rel="tag">articles</a>, <a href="http://andybeard.eu/tag/backlinks" title="backlinks" rel="tag">backlinks</a>, <a href="http://andybeard.eu/tag/better-blogging" title="Better Blogging" rel="tag">Better Blogging</a>, <a href="http://andybeard.eu/tag/blog" title="blog" rel="tag">blog</a>, <a href="http://andybeard.eu/tag/blog-navigation" title="Blog Navigation" rel="tag">Blog Navigation</a>, <a href="http://andybeard.eu/tag/blogging" title="blogging" rel="tag">blogging</a>, <a href="http://andybeard.eu/tag/blogging-tips" title="blogging tips" rel="tag">blogging tips</a>, <a href="http://andybeard.eu/tag/blogroll" title="Blogroll" rel="tag">Blogroll</a>, <a href="http://andybeard.eu/tag/comments" title="comments" rel="tag">comments</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/dynamic-linking" title="Dynamic Linking" rel="tag">Dynamic Linking</a>, <a href="http://andybeard.eu/tag/folksonomy" title="folksonomy" rel="tag">folksonomy</a>, <a href="http://andybeard.eu/tag/how-to" title="how to" rel="tag">how to</a>, <a href="http://andybeard.eu/tag/howto" title="howto" rel="tag">howto</a>, <a href="http://andybeard.eu/tag/linking-strategy" title="linking strategy" rel="tag">linking strategy</a>, <a href="http://andybeard.eu/tag/mininet" title="mininet" rel="tag">mininet</a>, <a href="http://andybeard.eu/tag/nofollow" title="nofollow" rel="tag">nofollow</a>, <a href="http://andybeard.eu/tag/revenge-of-the-mininet" title="revenge of the mininet" rel="tag">revenge of the mininet</a>, <a href="http://andybeard.eu/tag/search-engines" title="search engines" rel="tag">search engines</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a>, <a href="http://andybeard.eu/tag/site-navigation" title="Site Navigation" rel="tag">Site Navigation</a>, <a href="http://andybeard.eu/tag/ultimate-tag-warrior" title="ultimate tag warrior" rel="tag">ultimate tag warrior</a>, <a href="http://andybeard.eu/tag/utw" title="utw" rel="tag">utw</a>, <a href="http://andybeard.eu/tag/website-traffic" title="website traffic" rel="tag">website traffic</a><br />
]]></description>
			<content:encoded><![CDATA[
<p>Navigational elements on a blog or any website are an important feature, but you should be careful not to take things to extremes which can hurt the progress of your site, both from a SEO perspective and for website conversion.</p>
<p><strong>This post was originally posted Nov 7, 2006 &#8211; I have added a screenshot as the original subject site is no longer online &#8211; it is still just as relevant today as it was over 3 years ago. In places I have added some additional commentary or expanded on original ideas.</strong></p>
<p>References to PageRank should be looked on as synonymous with Google Juice &#038; overall site authority, and not just green pixels in a toolbar, though that can be a good visual indicator at times.</p>
<h3>How a Blogroll can kill your PageRank</h3>
<p>I followed a link from Digg a few minutes a go, read the story, and as I frequently do on any site I visit, I snooped around a little.</p>
<p>I actually do exactly the same every time someone writes a blog post referring to me and pings my blog.  It is the polite thing to do, and maybe I can add something to the conversation. It also allows me to relate any comment to the person who is writing about me, either positively or negatively. Everyone is entitled to opposing views. What is often important is why they have an opposing view, and it isn&#8217;t always obvious.</p>
<p>Now about the site in question:</p>
<ol>
<li>I have only read half of one article there, so I don&#8217;t know much about the site contents</li>
<li>The reason I am linking through to the site is purely from an SEO point of view</li>
<li>This is a very common problem, very easy to make, and honestly not too hard to correct.</li>
</ol>
<p>With that said, here is the site <a class="external" href="http://web.archive.org/web/20061108073352/http://kerryfoxlive.com/wordpress/">Kerry Fox Live</a> (Archive.org link &#8211; the site seems to have been offline for 2 years.)</p>
<h3><strong>Initial Site Analysis</strong></h3>
<p>So the first thing I notice is that it is a PR3 site.</p>
<p>The internal categories are mainly PR2</p>
<p>The archives are mainly PR2</p>
<p>The individual post pages are generally PR1 or unranked</p>
<p>A large proportion of the content is duplicate syndicated content from services such as Associated Press, without any wrapping</p>
<p><strong>But the site has been around for 16 months</strong></p>
<p>You can make a splog, chuck duplicate content at it, and get a PR4 or PR5 after a few months.</p>
<h3>So what is wrong with the site?</h3>
<p><img class="alignleft size-full wp-image-2860" title="Blogroll from " src="http://cdn5.andybeard.name/wp-content/uploads/Blogroll.png" alt="blogroll example" width="293" height="1000" />Take a look at the sidebar</p>
<p>At a guess (I am seriously not going to count them all), only 20% of the links on any given page point to an internal page. (yes that sidebar is on every page)<br />
There are 2 blogrolls, one of which seems to be websites and blogs he likes, and the other is a whole load of press related sites&#8230; news sources.</p>
<p>Every single one of those links is a live external link leaking PageRank to other sites. Those other sites are not reciprocating in any way.</p>
<p>Now I am sure someone is likely to point out that  those links provide a service for visitors, and maybe add a little authenticity to the site.</p>
<h3><strong>What visitors?</strong></h3>
<p>We are looking at a news site with an Alexa rank of close to 2M &#8211; not 2k, but 2M</p>
<p>Now there are times you want to sacrifice a little page rank to other sites, especially if they are reciprocating, sharing visitors, or in the case of my blog, I like visitors commenting and joing my &#8220;community&#8221;. You might also do it in a carefully controlled way from a mininet to one of your own sites.</p>
<h3>Solutions</h3>
<p>Get rid of the blogroll on all internal pages. It is giving away too much traffic to other sites, not to mention PageRank.</p>
<p><span style="text-decoration: line-through;">Add nofollow to all the blogroll links that are not reciprocating, or you don&#8217;t want to be overly friendly with.</span> (Update August 2010 I would probably tend to use javascript in some way)</p>
<p>Increase internal linking to compensate for all the leakage.</p>
<h3>How to Increase Internal Linking</h3>
<ul>
<li>Recent posts &#8211; 10 links</li>
<li>Top Posts &#8211; 10 links</li>
<li>Recent Comments &#8211; 5 &#8211; 10 links</li>
<li>Tagging + Tag Cloud &#8211; 50+ links</li>
<li>There wouldn&#8217;t be a need for as much internal ball linking if there wasn&#8217;t so many external leaks. The site is gaining very few comments.</li>
<li>Related posts &#8211; 5-10 links</li>
<li>Related reviews &#8211; 5-10 links</li>
<li>Glossary links</li>
</ul>
<p>Emphasis should be placed on the links you wish visitors to traverse</p>
<h3>External Linking</h3>
<p>The site has 2 visible external links to the front page. I am not sure how many to internal pages, but even if it did have external links, any PR given would immediate leak.</p>
<p>Just syndicating one article will generate loads of backlinks, far in excess of what you can achieve with a single blog post (unless you have 100k+ readers). Based on my analysis of &#8220;A&#8221; list bloggers, their average blog post might normally generate around 10 backlinks (showing in Google).</p>
<p>(update August 2010: &#8211; whilst many of the bloggers I analysed in 2006 have 10x as many subscribers by RSS &amp; email now, the number of links they receive, other than from splogs &amp; social media probably hasn&#8217;t increased)</p>
<h3>Conclusion</h3>
<p>It is not rocket science, just simple maths.</p>
<p>If you have 100 external links on every page of your site, you need lot of internal links to retain some (hopefully most) of your PageRank, and it would certain help if  those people you give a link to on your sidebar reciprocate in some manner.</p>
<p><strong>(please note that includes me &#8211; don&#8217;t put a link in your blogroll to my site &#8211; sure I appreciate the links, but I would much prefer just an occasional mention in your blog)</strong></p>
<p>If you can&#8217;t get a reciprocal link, use <span style="text-decoration: line-through;">nofollow</span>, (August 2010 &#8211; blocked external javascript), or stick them on their own seperate page so they don&#8217;t suck your own site dry.</p>
<p>And finally&#8230; this site structure plagues a huge proportion of blogs. Other blog owners who do not have this problem, quite likely don&#8217;t even realise why.</p>
<p>Further reading:</p>
<p><a href="http://andybeard.eu/2006/10/revenge-of-the-mininet-3rd-party-content-blog-comments-no-follow.html">Revenge of the Mininet | 3rd Party content | Blog Comments | No Follow</a></p>
<p>Update: whilst I am still a fan of article marketing, I no longer recommend any service that doesn&#8217;t provide a way to have unique passwords for each distribution site.</p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F121%252Fhow-a-blogroll-can-kill-your-pagerank.html%22%2C%20%22shorturl%22%3A%20%22http%3A%2F%2Fbit.ly%2FajXhVi%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22How%20a%20Blogroll%20Can%20Still%20Kill%20Your%20PageRank%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/article-marketing" title="article marketing" rel="tag">article marketing</a>, <a href="http://andybeard.eu/tag/article-submission" title="Article Submission" rel="tag">Article Submission</a>, <a href="http://andybeard.eu/tag/articles" title="articles" rel="tag">articles</a>, <a href="http://andybeard.eu/tag/backlinks" title="backlinks" rel="tag">backlinks</a>, <a href="http://andybeard.eu/tag/better-blogging" title="Better Blogging" rel="tag">Better Blogging</a>, <a href="http://andybeard.eu/tag/blog" title="blog" rel="tag">blog</a>, <a href="http://andybeard.eu/tag/blog-navigation" title="Blog Navigation" rel="tag">Blog Navigation</a>, <a href="http://andybeard.eu/tag/blogging" title="blogging" rel="tag">blogging</a>, <a href="http://andybeard.eu/tag/blogging-tips" title="blogging tips" rel="tag">blogging tips</a>, <a href="http://andybeard.eu/tag/blogroll" title="Blogroll" rel="tag">Blogroll</a>, <a href="http://andybeard.eu/tag/comments" title="comments" rel="tag">comments</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/dynamic-linking" title="Dynamic Linking" rel="tag">Dynamic Linking</a>, <a href="http://andybeard.eu/tag/folksonomy" title="folksonomy" rel="tag">folksonomy</a>, <a href="http://andybeard.eu/tag/how-to" title="how to" rel="tag">how to</a>, <a href="http://andybeard.eu/tag/howto" title="howto" rel="tag">howto</a>, <a href="http://andybeard.eu/tag/linking-strategy" title="linking strategy" rel="tag">linking strategy</a>, <a href="http://andybeard.eu/tag/mininet" title="mininet" rel="tag">mininet</a>, <a href="http://andybeard.eu/tag/nofollow" title="nofollow" rel="tag">nofollow</a>, <a href="http://andybeard.eu/tag/revenge-of-the-mininet" title="revenge of the mininet" rel="tag">revenge of the mininet</a>, <a href="http://andybeard.eu/tag/search-engines" title="search engines" rel="tag">search engines</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a>, <a href="http://andybeard.eu/tag/site-navigation" title="Site Navigation" rel="tag">Site Navigation</a>, <a href="http://andybeard.eu/tag/ultimate-tag-warrior" title="ultimate tag warrior" rel="tag">ultimate tag warrior</a>, <a href="http://andybeard.eu/tag/utw" title="utw" rel="tag">utw</a>, <a href="http://andybeard.eu/tag/website-traffic" title="website traffic" rel="tag">website traffic</a><br />
]]></content:encoded>
			<wfw:commentRss>http://andybeard.eu/121/how-a-blogroll-can-kill-your-pagerank.html/feed</wfw:commentRss>
		<slash:comments>70</slash:comments>
		</item>
		<item>
		<title>Google Broke My Christmas * (Supplemental Result Query Changes)</title>
		<link>http://andybeard.eu/1136/google-broke-my-christmas-supplemental-result-query-changes.html</link>
		<comments>http://andybeard.eu/1136/google-broke-my-christmas-supplemental-result-query-changes.html#comments</comments>
		<pubDate>Thu, 20 Dec 2007 01:30:17 +0000</pubDate>
		<dc:creator>Andy Beard</dc:creator>
				<category><![CDATA[blogging tips]]></category>
		<category><![CDATA[Google]]></category>
		<category><![CDATA[SEO Blog]]></category>
		<category><![CDATA[duplicate content]]></category>
		<category><![CDATA[supplemental results]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[tags]]></category>

		<guid isPermaLink="false">http://andybeard.eu/2007/12/google-broke-my-christmas-supplemental-result-query-changes.html</guid>
		<description><![CDATA[<p>If you read the Google blog or the <a href="http://searchengineland.com/071219-122926.php">coverage on Search Engine Land</a>, you might be rejoicing that <a href="http://googlewebmastercentral.blogspot.com/2007/12/ultimate-fate-of-supplemental-results.html">supplemental results are no more</a></p>
<p>It has been described as <a href="http://www.twentysteps.com/lipstick-on-a-pig/">lipstick on a pig</a> and others have just <a href="http://www.businessol.com/seo-blog/2007/12/top-5-lessons-from-death-of-google.html">offered tips on site indexing</a>.</p>
<h3>What Happened To My /* Search Query?</h3>
<p>Before this change, one of the tools still available to SEO practitioners to give an indication of the depth of site indexing was to add /* to the end on a site: search query.</p>
<p>Thus you would use</p>
<p>site:andybeard.eu/ - this would return the total pages supposedly indexed
site:andybeard.eu/* - this would return the</p>]]></description>
			<content:encoded><![CDATA[
<p>If you read the Google blog or the <a href="http://searchengineland.com/071219-122926.php">coverage on Search Engine Land</a>, you might be rejoicing that <a href="http://googlewebmastercentral.blogspot.com/2007/12/ultimate-fate-of-supplemental-results.html">supplemental results are no more</a></p>
<p>It has been described as <a href="http://www.twentysteps.com/lipstick-on-a-pig/">lipstick on a pig</a> and others have just <a href="http://www.businessol.com/seo-blog/2007/12/top-5-lessons-from-death-of-google.html">offered tips on site indexing</a>.</p>
<h3>What Happened To My /* Search Query?</h3>
<p>Before this change, one of the tools still available to SEO practitioners to give an indication of the depth of site indexing was to add /* to the end on a site: search query.</p>
<p>Thus you would use</p>
<p>site:andybeard.eu/ &#8211; this would return the total pages supposedly indexed<br />
site:andybeard.eu/* &#8211; this would return the number of pages in the primary index</p>
<p>By subtracting one from the other, you get some indication of the number of pages that might be in the supplemental results.</p>
<p>The numbers changed on a daily basis, and by datacenter, and were a little unpredictable, but it at least gave some indication.</p>
<p>Some sites I routinely checked for comparison were <a href="http://seobook.com">seo book</a>, <a href="http://wolf-howl.com">Michael Gray</a>, <a href="http://seomoz.org">Seomoz</a>, <a href="http://sphinn.com">Sphinn</a>, <a href="http://searchengineland.com">Search Engine Land</a>, <a href="http://searchenginejournal.com">Search Engine Journal</a>, <a href="http://bumpzee.com">Bumpzee</a>, <a href="http://blogcatalog.com">Blogcatalog</a>, <a href="http://mybloglog.com">Mybloglog</a> and a number of others.</p>
<p>Typically Seo Book and Michael Gray had very deep index penetration, with above 90% of their pages in the primary index as indicated by /*</p>
<p>Many of the higher output SEO blogs faired far worse, with sometimes less than 50% primary index penetration, but far more total pages in the primary index.</p>
<p>Site structure makes a huge difference &#8211; if you have lots of duplicate content pages such as extensive use of tagging, you might end up with a fair number of those pages in the Supplemental Index because they do not receive a huge amount of links from external sources, and many receive a very small percentage of internal linking.<br />
They would however still rank well for long tail search queries because of the different title tag, and combinations of content presented.</p>
<p><strong>A wider net sometimes has bigger holes&#8230;</strong></p>
<h3>/* Now Returns Significantly Fewer Results</h3>
<p>SEO Book now returns less than 50% of pages with /*<br />
Michael manages 50%<br />
SEOmoz has less than 20%<br />
Search Engine Land seems to be fairing well with close to 75%, actually more than previously (I seem to remember less than 50%)<br />
Search Engine Journal also manages close to 75%, again more than previously (again it was less than 50%)</p>
<p>I have dropped down to around 30% what was previously 85%, though my site structure isn&#8217;t quite the same as I had it before WordPress 2.3.1 (I still need to get some plugins modified)<br />
Site structure might have had as much as a 10 or 20% difference, but not more.</p>
<p>I still see very little difference in Search traffic or positioning</p>
<h3>I Don&#8217;t Know What It Means&#8230;</h3>
<ul>
<li>It could be some datacenter issues that mean that only a small percentage of sites have so far been updated</li>
<li>I am currently discounting this being some kind of penalty</li>
<li>Rather than reducing the size of the supplemental index, Google might now be storing the majority of pages in Supplemental, and effectively have a &#8220;super primary&#8221; index instead.</li>
<li>The tool could just be broken or set to give random results</li>
</ul>
<p>I can understand the removal of supplemental results from the primary SERPs, but /* was actually quite useful. If supplemental results have disappeared, you would expect it to return the same number of pages as the search query without /*</p>
<p>Why do we have a useful tool fubarred?</p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F1136%252Fgoogle-broke-my-christmas-supplemental-result-query-changes.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22Google%20Broke%20My%20Christmas%20%2A%20%28Supplemental%20Result%20Query%20Changes%29%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/supplemental-results" title="supplemental results" rel="tag">supplemental results</a>, <a href="http://andybeard.eu/tag/tagging" title="tagging" rel="tag">tagging</a>, <a href="http://andybeard.eu/tag/tags" title="tags" rel="tag">tags</a><br />
]]></content:encoded>
			<wfw:commentRss>http://andybeard.eu/1136/google-broke-my-christmas-supplemental-result-query-changes.html/feed</wfw:commentRss>
		<slash:comments>12</slash:comments>
		</item>
		<item>
		<title>Do Google Hate Paid Links, Duplicate Content and Cruft?</title>
		<link>http://andybeard.eu/709/google-duplicate-content.html</link>
		<comments>http://andybeard.eu/709/google-duplicate-content.html#comments</comments>
		<pubDate>Wed, 02 May 2007 11:59:01 +0000</pubDate>
		<dc:creator>Andy Beard</dc:creator>
				<category><![CDATA[Google]]></category>
		<category><![CDATA[SEO Blog]]></category>
		<category><![CDATA[duplicate content]]></category>
		<category><![CDATA[page load]]></category>
		<category><![CDATA[paid links]]></category>
		<category><![CDATA[paid reviews]]></category>
		<category><![CDATA[search engine optimization]]></category>

		<guid isPermaLink="false">http://andybeard.eu/2007/05/google-duplicate-content.html</guid>
		<description><![CDATA[
<p>Eric Enge Interviews Adam Lasnik about paid links, duplicate content and crufty pages (lots of code, little content)</p>
<h3>Takeaways</h3>
<p>I am sorry to say not a lot, it reinforces Google&#8217;s position not to really say a lot, though apparently there is no real penalty for duplicate content, and not to worry about how pagerank flows in your site.</p>
<p><a href="http://andybeard.eu/709/google-duplicate-content.html" class="more-link">Read more on Do Google Hate Paid Links, Duplicate Content and Cruft?&#8230;</a></p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F709%252Fgoogle-duplicate-content.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22Do%20Google%20Hate%20Paid%20Links%2C%20Duplicate%20Content%20and%20Cruft%3F%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/google" title="Google" rel="tag">Google</a>, <a href="http://andybeard.eu/tag/page-load" title="page load" rel="tag">page load</a>, <a href="http://andybeard.eu/tag/paid-links" title="paid links" rel="tag">paid links</a>, <a href="http://andybeard.eu/tag/paid-reviews" title="paid reviews" rel="tag">paid reviews</a>, <a href="http://andybeard.eu/tag/search-engine-optimization" title="search engine optimization" rel="tag">search engine optimization</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a><br />
]]></description>
			<content:encoded><![CDATA[
<p>Eric Enge Interviews Adam Lasnik about paid links, duplicate content and crufty pages (lots of code, little content)</p>
<h3>Takeaways</h3>
<p>I am sorry to say not a lot, it reinforces Google&#8217;s position not to really say a lot, though apparently there is no real penalty for duplicate content, and not to worry about how pagerank flows in your site.</p>
<p>So if you ended up with some of your internal pages PR5, and your home page PR2, don&#8217;t worry, you won&#8217;t have a problem selling extremely below market price text links&#8230; cough</p>
<p>About the reporting of paid links Adam had this to say:-</p>
<blockquote><p>One of the most important points to make of this is that this is used to augment our data, and it&#8217;s not used to specifically take actions against sites.</p></blockquote>
<p>.. plus quite a bit more about how this is really just to &#8220;augment&#8221; existing data.</p>
<p>On snitching&#8230;</p>
<blockquote><p>But, on the reassuring side, we&#8217;ve had some people voice concerns &#8220;what happens if my competitor decides to report my pages, even though they are completely following the webmaster guidelines. Is some action going to be taken?&#8221; The answer to that is definitively not, because this does not lead directly into an action pipeline, but rather it is used only for review. It is not going to directly or adversely affect any pages or sites that are following the webmaster guidelines.</p></blockquote>
<p>I did leave a comment and have exchanged emails with Eric over something related. We will see if what I have discovered is related or just a bug.</p>
<p>I did give Eric&#8217;s interview a Digg, as it is very suitable for a home page. It is not really SEO, but &#8220;Google&#8221; after all.</p>
<p><a href="http://digg.com/tech_news/Exclusive_Google_s_Adam_Lasnik_on_Paid_Links_Duplicate_Content">Digg Story</a></p>
<p>Go on, give it one, I need to get my Digg account a little more credible, and that helps you too.</p>
<p>Read the full interview with <a href="http://www.stonetemple.com/articles/interview-adam-lasnik.shtml">Google&#8217;s Adam Lasnik</a></p>
<h3>Update: The Paid Link Meme</h3>
<p>I thought I would add this as some counter-perspective on Adam Lasnik&#8217;s position, and that of Matt Cutts and Google in regards to paid links.<br />
They have always argued that paid links are always detectable. <a href="http://www.wolf-howl.com/grayhat-seo/the-paid-link-blog-meme/">Graywolf blew that theory apart.</a></p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F709%252Fgoogle-duplicate-content.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22Do%20Google%20Hate%20Paid%20Links%2C%20Duplicate%20Content%20and%20Cruft%3F%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/google" title="Google" rel="tag">Google</a>, <a href="http://andybeard.eu/tag/page-load" title="page load" rel="tag">page load</a>, <a href="http://andybeard.eu/tag/paid-links" title="paid links" rel="tag">paid links</a>, <a href="http://andybeard.eu/tag/paid-reviews" title="paid reviews" rel="tag">paid reviews</a>, <a href="http://andybeard.eu/tag/search-engine-optimization" title="search engine optimization" rel="tag">search engine optimization</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a><br />
]]></content:encoded>
			<wfw:commentRss>http://andybeard.eu/709/google-duplicate-content.html/feed</wfw:commentRss>
		<slash:comments>6</slash:comments>
		</item>
		<item>
		<title>Are Yahoo Guilty of Unethical Plagiarism With Syndicated Content?</title>
		<link>http://andybeard.eu/594/are-yahoo-guilty-of-unethical-plagiarism-with-syndicated-content.html</link>
		<comments>http://andybeard.eu/594/are-yahoo-guilty-of-unethical-plagiarism-with-syndicated-content.html#comments</comments>
		<pubDate>Fri, 30 Mar 2007 16:46:07 +0000</pubDate>
		<dc:creator>Andy Beard</dc:creator>
				<category><![CDATA[news]]></category>
		<category><![CDATA[afp]]></category>
		<category><![CDATA[attribution]]></category>
		<category><![CDATA[duplicate content]]></category>
		<category><![CDATA[ethics]]></category>
		<category><![CDATA[hoax]]></category>
		<category><![CDATA[links]]></category>
		<category><![CDATA[museum of hoaxes]]></category>
		<category><![CDATA[press]]></category>
		<category><![CDATA[rss]]></category>
		<category><![CDATA[syndication]]></category>
		<category><![CDATA[yahoo]]></category>

		<guid isPermaLink="false">http://andybeard.eu/2007/03/are-yahoo-guilty-of-unethical-plagiarism-with-syndicated-content.html</guid>
		<description><![CDATA[<p>Bloggers often complain that another blogger has stolen their content (plagiarism) or reworked their ideas without giving credit, and on the internet among bloggers, credit isn&#039;t just mentioning their names but providing a link, preferably to the original article.</p>
<h3>Major Websites and Press Agencies Seriously Don&#039;t Give a Damn About Conventions</h3>
<p></p>
<p><div style="width:400px;" class="important">I am not a lawyer, this post is personal opinion. Please treat any legal information as for entertainment purposes only</div>
</p>
<p>Vipul Arora wrote a story today entitled <a href="http://www.leftimpact.com/20070330-16/yahoo-plagiarizes-content-does-not-give-credit.html">Yahoo plagiarizes content - does not give credit!!</a></p>
<p>But was it plagiarism?</p>
<p>Lets go into detail and see what happens, and how this all</p>]]></description>
			<content:encoded><![CDATA[
<p>Bloggers often complain that another blogger has stolen their content (plagiarism) or reworked their ideas without giving credit, and on the internet among bloggers, credit isn&#8217;t just mentioning their names but providing a link, preferably to the original article.</p>
<h3>Major Websites and Press Agencies Seriously Don&#8217;t Give a Damn About Conventions</h3>
<p></p>
<p><div style="width:400px;" class="important">I am not a lawyer, this post is personal opinion. Please treat any legal information as for entertainment purposes only</div>
</p>
<p>Vipul Arora wrote a story today entitled <a href="http://www.leftimpact.com/20070330-16/yahoo-plagiarizes-content-does-not-give-credit.html">Yahoo plagiarizes content &#8211; does not give credit!!</a></p>
<p>But was it plagiarism?</p>
<p>Lets go into detail and see what happens, and how this all works.</p>
<p>Museum of Hoaxes publish a great piece of linkbait &#8220;<a href="http://www.museumofhoaxes.com/hoax/aprilfool/">Top100 April Fool&#8217;s Hoaxes of All Time</a>&#8221;</p>
<p><img src='http://cdn5.andybeard.name/wp-content/uploads/museum-hoaxes.jpg' alt='Museum of Hoaxes' /></p>
<h3>The Missing Pointer</h3>
<p><a href="http://www.afp.com">AFP </a>Picks up the story</p>
<p>Now unfortunately AFP doesn&#8217;t include a link through to the original source of the material it used. Links provide attribution on the internet and are used by visitors to read the rest of the story (only the top10 was published, not all 100 items), and by <a href="http://andybeard.eu/2007/01/articles-are-seeds-of-knowledge-a-biblical-look-at-duplicate-content.html">search engines in their calculation of the original source</a>.</p>
<p>I am not sure where the law is on this, they only used 10% of the material, and they did provide attribution in textual form. They also didn&#8217;t use the content word for word.</p>
<p>Then again in value to readers the Top 10 is probably worth more than positions 20 &#8211; 100</p>
<blockquote><p>Here are 10 of the top April Fool&#8217;s Day pranks ever pulled off, as judged by the San Diego-based Museum of Hoaxes for their notoriety, absurdity, and number of people duped.</p></blockquote>
<p>You might think this is a minor issue, but <a href="http://www.google.com/search?hl=en&#038;&#038;q=%22Ten+of+the+best+April+Fool%E2%80%99s+Day+hoaxes">Google currently shows the title of the story on 10,900 websites.</a></p>
<h3>Yahoo Plagiarism?</h3>
<p>Yahoo was the most prominent site that picked up the story &#8211; they have permission from AFP to use the content that legally probably isn&#8217;t plagiarism, but bloggers if it happened to them would be very upset, unless they gave specific permission.</p>
<p><img src='http://cdn5.andybeard.name/wp-content/uploads/yahoo-hoaxes.jpg' alt='Yahoo Hoaxes' /></p>
<p>Yahoo are in many ways the innocent party in this, but ultimately the site that is benefiting from the content the most. It is a very popular story that has already garnered over 900 votes on Yahoo. That is a lot of votes as not every reader would click the vote button.</p>
<p>Just imagine if there was a link through to the original source</p>
<h3>Effect on Traffic</h3>
<p>The Museum of Hoaxes should have had a tidal wave of eager readers visiting their site. It is possible they gained a small surge from search traffic from people who were interested in finding the rest of the Top100.</p>
<p>The story should have also done insanely well on social bookmarking services.</p>
<p><img src='http://cdn5.andybeard.name/wp-content/uploads/museum-of-hoaxes.png' alt='Museum of Hoaxes on Digg' /></p>
<p>This is actually an extreme example of what happens when correct attribution (in internet terms) isn&#8217;t given by the press to the original author of an article.</p>
<h3>Printed Media</h3>
<p>Printed media in the UK, if referencing a website, typically use a service such as TinyURL.com to provide a link from an article so that they don&#8217;t have to print a long URL &#8211; that is a very ethical method, though I would question why they don&#8217;t spend $20 and buy their own redirect script that can be branded.</p>
<h3>A Similar Example</h3>
<p>This is actually a similar situation to what happened with Colleen who was recently interviewed by the <a href="http://andybeard.eu/2007/03/womma-should-watch-who-they-quote-and-especially-who-they-link-to.html">LA Times regarding PayPerPost</a>.</p>
<p>The followup video interview was a cracker, and you really should read the comments for a discussion on <a href="http://andybeard.eu/2007/03/payperpost-ted-murphy-vs-jason-calacanis-the-ultimate-showdown.html">ThisNext vs PayPerPost</a>, and whether you should have to use a disclosure when commenting.</p>
<p>I should also point out that I have seen a number of blogs that have also written about the LA Times story, and linked to their syndication partners ;)</p>
<h3>Pot Calling the Kettle Black</h3>
<p>The press shouldn&#8217;t attack the ethics of bloggers if they don&#8217;t provide correct attribution for the medium in which they are working. On TV it is verbal, in print it is written, and the best print even provide short links.</p>
<p><strong>Online correct attribution is links.</strong> </p>
<p>Even Wikipedia provide a clickable click, <a href="http://en.wikipedia.org/wiki/April_Fools'_Day">although it does use nofollow</a> </p>
<p>Note: Screenshots were used with permission from Vipul, it saved me 5 minutes preparing this. He has contacted AFP questioning their method of attribution.</p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F594%252Fare-yahoo-guilty-of-unethical-plagiarism-with-syndicated-content.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22Are%20Yahoo%20Guilty%20of%20Unethical%20Plagiarism%20With%20Syndicated%20Content%3F%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/afp" title="afp" rel="tag">afp</a>, <a href="http://andybeard.eu/tag/attribution" title="attribution" rel="tag">attribution</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/ethics" title="ethics" rel="tag">ethics</a>, <a href="http://andybeard.eu/tag/hoax" title="hoax" rel="tag">hoax</a>, <a href="http://andybeard.eu/tag/links" title="links" rel="tag">links</a>, <a href="http://andybeard.eu/tag/museum-of-hoaxes" title="museum of hoaxes" rel="tag">museum of hoaxes</a>, <a href="http://andybeard.eu/tag/news" title="news" rel="tag">news</a>, <a href="http://andybeard.eu/tag/press" title="press" rel="tag">press</a>, <a href="http://andybeard.eu/tag/rss" title="rss" rel="tag">rss</a>, <a href="http://andybeard.eu/tag/syndication" title="syndication" rel="tag">syndication</a>, <a href="http://andybeard.eu/tag/yahoo" title="yahoo" rel="tag">yahoo</a><br />
]]></content:encoded>
			<wfw:commentRss>http://andybeard.eu/594/are-yahoo-guilty-of-unethical-plagiarism-with-syndicated-content.html/feed</wfw:commentRss>
		<slash:comments>5</slash:comments>
		</item>
		<item>
		<title>In Depth: Google BlogSearch &#124; Ranking Blog Documents Patent</title>
		<link>http://andybeard.eu/543/google-blog-search.html</link>
		<comments>http://andybeard.eu/543/google-blog-search.html#comments</comments>
		<pubDate>Fri, 23 Mar 2007 13:24:02 +0000</pubDate>
		<dc:creator>Andy Beard</dc:creator>
				<category><![CDATA[blogging tips]]></category>
		<category><![CDATA[Google]]></category>
		<category><![CDATA[plugins]]></category>
		<category><![CDATA[SEO Blog]]></category>
		<category><![CDATA[backlinks]]></category>
		<category><![CDATA[blogging]]></category>
		<category><![CDATA[bloglines]]></category>
		<category><![CDATA[blogsearch]]></category>
		<category><![CDATA[duplicate content]]></category>
		<category><![CDATA[feedburner]]></category>
		<category><![CDATA[Google Blog Search]]></category>
		<category><![CDATA[google blogsearch]]></category>
		<category><![CDATA[linking strategy]]></category>
		<category><![CDATA[rss]]></category>
		<category><![CDATA[RSS Subscribers]]></category>
		<category><![CDATA[search engine optimization]]></category>
		<category><![CDATA[search engines]]></category>
		<category><![CDATA[subscribers]]></category>
		<category><![CDATA[tag]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[tags]]></category>
		<category><![CDATA[technorati]]></category>
		<category><![CDATA[Technorati Favorites]]></category>
		<category><![CDATA[ultimate tag warrior]]></category>
		<category><![CDATA[utw]]></category>

		<guid isPermaLink="false">http://andybeard.eu/2007/03/google-blog-search.html</guid>
		<description><![CDATA[
<div style="float:right;"><img src='http://cdn5.andybeard.name/wp-content/uploads/rel-tag.png' alt='Using Internal tags with Ultimate Tag Warrior' /></div>
<p>For a long time my blogs have performed amazingly well with <a href="http://blogsearch.google.com/">Google Blog Search</a>. I always appear in the relevant results quickly, and the results I obtain have some reasonable longevity, even when I am not the original source of a story.</p>
<p><a href="http://andybeard.eu/543/google-blog-search.html" class="more-link">Read more on In Depth: Google BlogSearch &#124; Ranking Blog Documents Patent&#8230;</a></p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F543%252Fgoogle-blog-search.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22In%20Depth%3A%20Google%20BlogSearch%20%7C%20Ranking%20Blog%20Documents%20Patent%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/backlinks" title="backlinks" rel="tag">backlinks</a>, <a href="http://andybeard.eu/tag/blogging" title="blogging" rel="tag">blogging</a>, <a href="http://andybeard.eu/tag/bloglines" title="bloglines" rel="tag">bloglines</a>, <a href="http://andybeard.eu/tag/blogsearch" title="blogsearch" rel="tag">blogsearch</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/feedburner" title="feedburner" rel="tag">feedburner</a>, <a href="http://andybeard.eu/tag/google" title="Google" rel="tag">Google</a>, <a href="http://andybeard.eu/tag/google-blog-search" title="Google Blog Search" rel="tag">Google Blog Search</a>, <a href="http://andybeard.eu/tag/google-blogsearch" title="google blogsearch" rel="tag">google blogsearch</a>, <a href="http://andybeard.eu/tag/linking-strategy" title="linking strategy" rel="tag">linking strategy</a>, <a href="http://andybeard.eu/tag/rss" title="rss" rel="tag">rss</a>, <a href="http://andybeard.eu/tag/rss-subscribers" title="RSS Subscribers" rel="tag">RSS Subscribers</a>, <a href="http://andybeard.eu/tag/search-engine-optimization" title="search engine optimization" rel="tag">search engine optimization</a>, <a href="http://andybeard.eu/tag/search-engines" title="search engines" rel="tag">search engines</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a>, <a href="http://andybeard.eu/tag/subscribers" title="subscribers" rel="tag">subscribers</a>, <a href="http://andybeard.eu/tag/tag" title="tag" rel="tag">tag</a>, <a href="http://andybeard.eu/tag/tagging" title="tagging" rel="tag">tagging</a>, <a href="http://andybeard.eu/tag/tags" title="tags" rel="tag">tags</a>, <a href="http://andybeard.eu/tag/technorati" title="technorati" rel="tag">technorati</a>, <a href="http://andybeard.eu/tag/technorati-favorites" title="Technorati Favorites" rel="tag">Technorati Favorites</a>, <a href="http://andybeard.eu/tag/ultimate-tag-warrior" title="ultimate tag warrior" rel="tag">ultimate tag warrior</a>, <a href="http://andybeard.eu/tag/utw" title="utw" rel="tag">utw</a><br />
]]></description>
			<content:encoded><![CDATA[
<div style="float:right;"><img src='http://cdn5.andybeard.name/wp-content/uploads/rel-tag.png' alt='Using Internal tags with Ultimate Tag Warrior' /></div>
<p>For a long time my blogs have performed amazingly well with <a href="http://blogsearch.google.com/">Google Blog Search</a>. I always appear in the relevant results quickly, and the results I obtain have some reasonable longevity, even when I am not the original source of a story.</p>
<p>Considering how much competition I often have for certain search terms which everyone seems to be writing about because of common interest, I must have been doing a number of things right.</p>
<p>Bill Slawski of SEO By The Sea a few of days ago <a href="http://www.seobythesea.com/?p=541">broke the news</a> of Google&#8217;s Patent Application for <a href="http://appft1.uspto.gov/netacgi/nph-Parser?Sect1=PTO1&#038;Sect2=HITOFF&#038;d=PG01&#038;p=1&#038;u=%2Fnetahtml%2FPTO%2Fsrchnum.html&#038;r=1&#038;f=G&#038;l=50&#038;s1=%2220070061297%22.PGNR.&#038;OS=DN/20070061297&#038;RS=DN/20070061297">Ranking Blog Documents</a>.</p>
<p><a href="http://www.seroundtable.com/archives/012753.html">SEO Round Table</a> posted a synopsis lifted from the <a href="http://www.cre8asiteforums.com/forums/index.php?showtopic=47645">Cre8asite Forum</a>s that had been posted by Bill, and seems to be the easiest to understand.</p>
<p>I am going to do a little bit of mix and match here, and inject my own commentary but my interpretation of the patent is actually slightly different to those that I have read so far.</p>
<p>It should be noted I am working my way through the patent itself, and <strong>not recompiling the summaries of others</strong>.</p>
<h3>Relevancy &#038; Quality &#8211; Blog | Blogpost</h3>
<p>It should first of all be noted that in the patent Google doesn&#8217;t differentiate between individual blog posts and whole blogs.</p>
<blockquote><p>The phrase &#8220;blog document,&#8221; as used hereinafter, is to be broadly interpreted to include a blog, a blog post, or both a blog and a blog post. It will be appreciated that the techniques described herein are equally applicable to blogs and blog posts.</p></blockquote>
<p>Later on in the patent, they also mention that feeds are also included within the documents that are compared and rated.</p>
<blockquote><p>
two distinct sets of data are used to determine a score of a blog (or blog post) in response to a search query&#8211;the topical relevance of the blog (or blog post) to the terms in the search query and the quality of the blog (or blog post), which is independent of the query terms. The quality of the blog (or blog post) may positively or negatively affect the score of the blog (or blog post)
</p></blockquote>
<p>Relevancy &#8211; this applies to the search term, thus Google will analyse the blog page, and they will also in some way determine the relevance to the whole blog.<br />
Quality &#8211; this is irrespective of the search term, so think about factors from outside your niche </p>
<h3>Google Blog Search &#8211; Positive Factors Affecting Search Quality | Relevancy</h3>
<ul>
<li><strong>Popularity of the blog document</strong></li>
<blockquote><p>A number of news aggregator sites (commonly called &#8220;news readers&#8221; or &#8220;feed readers&#8221;) exist where individuals can subscribe to a blog document (through its feed). Such aggregators store information describing how many individuals have subscribed to given blog documents. A blog document having a high number of subscriptions implies a higher quality for the blog document</p></blockquote>
<p>This patent was first of all applied for  13th September 2005, with Google Blog Search launched 13 September 2005. At the time they were logically not basing this on numbers available for Google Reader subscribers. The Google Reader blog was launched October 21, 2005 with a post saying they had been up and running for 2 weeks.<br />
Maybe there is a coincidence between the 2 events.</p>
<p>So which data were Google basing this part of their patent on? Some services such as Technorati and Bloglines do provide readership data, as does Feedburner, though most services report readership data as they are collecting new blog posts to a service like Feedburner, who aggregate the statistics.</p>
<p>It seems there might be some value is collecting Technorati favorites (my reciprocation policy might be well worth it) beyond limited bragging rights. Google of course through Google Reader now have access to lots of usage data, so maybe other sources will eventually be phased out.</p>
<li><strong>Implied popularity of the blog document</strong></li>
<blockquote><p>This implied popularity may be identified by, for example, examining the click stream of search results. For example, if a certain blog document is clicked more than other blog documents when the blog document appears in result sets, this may be an indication that the blog document is popular and, thus, a positive indicator of the quality of the blog document. </p></blockquote>
<p>Click data from search results, possible from Google Toolbar users.</p>
<li><strong>Existence of the blog document in blogrolls</strong></li>
<blockquote><p>The existence of the blog document in blogrolls may be a positive indication of the quality of the blog document. It will be appreciated that blog documents often contain not only recent entries (i.e., posts), but also &#8220;blogrolls,&#8221; which are a dense collection of links to external sites (usually other blogs) in which the author/blogger is interested. A blogroll link to a blog document is an indication of popularity of that blog document, so aggregated blogroll links to a blog document can be counted and used to infer magnitude of popularity for the blog document. </p></blockquote>
<p>Everything I have ever read has suggested that for normal search, blogroll links that are site wide carry diminishing value. Just because it is listed here as part of the calculation does not necessarily mean that everyone should start building up huge blogrolls&#8230; well unless they want to game Technorati and have a blog network.</p>
<li><strong>Existence of the blog document in a high quality blogroll</strong></li>
<blockquote><p>The existence of the blog document in a high quality blogroll may be a positive indication of the quality of the blog document. A high quality blogroll is a blogroll that links to well-known or trusted bloggers. Therefore, a high quality blogroll that also links to the blog document is a positive indicator of the quality of the blog document. </p></blockquote>
<p>Another revelation, links on high quality pages are worth more than links on low quality pages.</p>
<p>Remember that <em>&#8220;blog document&#8221;</em> can mean both <strong>blog page</strong> and <strong>blog site</strong>. </p>
<p>Can blogroll just refer to a list of links on what is identified as a blog. Thus a column of links to related pages might also class as a blogroll, whether in the sidebar or below the content.<br />
Thus a list of links to related documents on the same site could be looked on as a blogroll on a blog document.</p>
<p>Related links plugins are very powerful, especially if you also include them in content that gets syndicated by design, or by sploggers.</p>
<li><strong>Tagging of the blog document</strong></li>
<blockquote><p>Tagging of the blog document may be a positive indication of the quality of the blog document. Some existing sites allow users to add &#8220;tags&#8221; to (i.e., to &#8220;categorize&#8221;) a blog document. These custom categorizations are an indicator that an individual has evaluated the content of the blog document and determined that one or more categories appropriately describe its content, and as such are a positive indicator of the quality of the blog document.</p></blockquote>
<p>Well some sites do allow you to tag in a meaningful way, maybe Google uses shared tags from Del.icio.us and other sites, but many of those use nofollow extensively.<br />
It is my own belief that self tagging content heavily with plugins such as Ultimate Tag Warrior helps a huge amount. I have given lots of examples before, but more recent examples include</p>
<p>toolbar pagerank<br />
google reader feedburner<br />
feedburner google reader<br />
compete toolbar<br />
duplicate content supplemental results</p>
<p>Yes, I am just going down the inbound traffic results looking for likely candidates that rank well in both blog and normal search and aren&#8217;t totally obscure. These are subjects that sites in my niche have also talked about, with the keywords in the title, and which you would expect to rank higher than my own content.</p>
<p>This doesn&#8217;t just affect blogsearch, Google have been using it for some time with the main results as well.<br />
Here are my <a href="http://andybeard.eu/2006/11/utw-tagging-seo-tricks-pt-2.html">observations regarding tagging</a> from back in November, especially how they could relate to LSI calculations.</p>
<li><strong>References to the blog document by other sources</strong></li>
<p>Wow revelation again, god links are worth having either to pages or blog.</p>
<li><strong>Pagerank of the blog document</strong></li>
</ul>
<p>Pagerank is still relevant, who knows for how long and how much.</p>
<blockquote><p>It will be appreciated that other indicators may also be used. </p></blockquote>
<p>What seems to be missing, at least at time of application?</p>
<ul>
<li>Domain age?</li>
<li>Trustrank?</li>
<li>Page Titles?</li>
<li>URLs?</li>
<li>Growth rate of link popularity</li>
</ul>
<p>Plus lots more that also factor into it, but general search patents probably also cover blog search.</p>
<h3>Google Blog Search &#8211; Negative Factors Affecting Search Relevancy | Quality</h3>
<ul>
<strong>
<li>Frequency of new posts on the blog document</li>
<p></strong></p>
<blockquote><p>The frequency at which new posts are added to the blog document may be a negative indication of the quality of that blog document. Feeds typically include only the most recent posts from a blog document. Spammers often generate new posts in spurts (i.e., many new posts appear within a short time period) or at predictable intervals (one post every 10 minutes, or a post every 3 hours at 32 minutes past the hour). Both behaviors are correlated with malicious intent and can be used to identify possible spammers. Therefore, if the frequency at which new posts are added to the blog document matches a predictable pattern, this may be a negative indication of the quality of the blog document. </p></blockquote>
<p>Make sure there is some variation when you publish your content for the day, especially with future dated posts.<br />
Most spamming tools are actually fairly sophisticated, thus I am not sure this measurement is very accurate. It most likely indicated a blogger who is very organised these days.</p>
<p><strong>
<li>The content of the posts in the blog document</li>
<p></strong></p>
<blockquote><p>
The content of the posts in the blog document may be a negative indication of the quality of that blog document. A feed typically contains some or all of the content of several posts from a given blog document. The blog document itself also includes the content of the posts. Spammers may put one version of content into a feed to improve their ranking in search results, while putting a different version on their blog document (e.g., links to irrelevant ads). This mismatch (between feed and blog document) can, therefore, be a negative indication of the quality of the blog document.</p></blockquote>
<p>This is actually a very significant and interestingly worded item. Google are stating that they are comparing the content of a feed with the content on your pages to ensure it matches.</p>
<p>Based upon this:-</p>
<ul>
<li>Don&#8217;t use a content spinner on your feeds to avoid duplicate content</li>
<li>Allow Google to index your feeds</li>
<li>If you use related links on your blog, make sure you use them in your feeds too</li>
</ul>
<p><strong>
<li>Duplicate Content, especially in feeds</li>
<p></strong></p>
<blockquote><p>
Also, in some instances, particular content may be duplicated in multiple posts in a blog document, resulting in multiple feeds containing the same content. Such duplication indicates the feed is low quality/spam and, thus, can be a negative indication of the quality of the blog document.
</p></blockquote>
<p>I can&#8217;t say I have noticed a problem having a lot of straggling RSS feeds on categories and tags.<br />
This could also be referring to things like the large footer I have on each post, though I haven&#8217;t seen a problem with that either.</p>
<p>After the last <a href="http://andybeard.eu/2007/01/toolbar-pagerank-ball-linking.html">toolbar pagerank update</a> I spent some time studying Matt Cutts&#8217; blog, and also looking at how pagerank was being transferred around my own site. Pagerank is only slightly useful as a guide, and only immediately after an update.<br />
Rather than repeat myself, you can read about my <a href="http://andybeard.eu/2007/01/toolbar-pagerank-ball-linking.html">organic garden approach</a> to this site.</p>
<p><strong></p>
<li>Collective Intelligence
</li>
<p></strong></p>
<blockquote><p>The words/phrases used in the posts of a blog document may also be a negative indication of the quality of that blog document. For example, from a collection of blog documents and feeds that evaluators rate as spam, a list of words and phrases (bigrams, trigrams, etc.) that appear frequently in spam may be extracted. If a blog document contains a high percentage of words or phrases from the list, this can be a negative indication of quality of the blog document.</p></blockquote>
<p>Google invest a lot of research analysing spam, detecting various word matching patterns, and use that to identify other documents.</p>
<p><strong>
<li>A size of the posts in the blog document</li>
<p></strong></p>
<blockquote><p>
The size of the posts in a blog document may be a negative indication of quality of the blog document. Many automated post generators create numerous posts of identical or very similar length. As a result, the distribution of post sizes can be used as a reliable measure of spamminess. When a blog document includes numerous posts of identical or very similar length, this may be a negative indication of quality of the blog document.</p></blockquote>
<p>This might be of special interest to those that use out-sourcing for articles, you need to ensure the article length changes.</p>
<p><strong>
<li>A link distribution of the blog document</li>
<p></strong></p>
<blockquote><p>A link distribution of the blog document may be a negative indication of quality of the blog document. As disclosed above, some posts are created to increase the pagerank of a particular blog document. In some cases, a high percentage of all links from the posts or from the blog document all point to ether a single web page, or to a single external site. If the number of links to any single external site exceeds a threshold, this can be a negative indication of quality of the blog document.</p></blockquote>
<p>In some ways this debunks the benefits of blogrolls mentioned as a benefit, but as previously quoted, Google are using blog document in multiple context, and comparing the context, thus it could just refer to multiple spam links always pointing to a single domain within the content.</p>
<p><strong>
<li>The presence of ads in the blog document</li>
<p></strong></p>
<blockquote><p>The presence of ads in the blog document may be a negative indication of quality of the blog document. If a blog document contains a large number of ads, this may be a negative indication of the quality of the blog document. </p></blockquote>
<p>Remember this is just a patent, and Google recently relaxed the rules about having ads from other networks along with Adsense. As long as a page is of a reasonable size to support the adverts, I don&#8217;t think there is a problem. If you just have a heading and 5 words, with 10 advertising blocks, you might want to add a few more words.</p>
<p>However they go on to say this</p>
<blockquote><p>Moreover, blog documents typically contain three types of content: the content of recent posts, a blogroll, and blog metadata (e.g., author profile information and/or other information pertinent to the blog document or its author). Ads, if present, typically appear within the blog metadata section or near the blogroll. The presence of ads in the recent posts part of a blog document may be a negative indication of the quality of the blog document. </p></blockquote>
<p>Thus if you are using blocks in the content for all your ads, you might not rank as well, especially if you use multiple networks. You can probably get away with 3 in the content, or maybe 1 or 2 per post.</p>
<p><strong>
<li>It will be appreciated that other indicators may also be used</li>
<p></strong></p>
</ul>
<h3>Conclusion</h3>
<p>The feed stats information is very useful, and looking at the timing, my conclusion is that Google might have been using Bloglines and Technorati Favorites data, with Google Reader in its infancy, or maybe though less likely, when blog search was introduced, they weren&#8217;t using that part of the patent</p>
<p>For me the most significant information was tagging, but just linking though to Technorati with your tags isn&#8217;t a great idea.</p>
<p>Remember that Google have their own blogging system, and they have archives and labels, and they are not going to create a system to generate duplicate content and then penalise you for it. Google wouldn&#8217;t have added such a system unless they intended to benefit from the enhanced data.</p>
<p><strong>You don&#8217;t have to build your blogs in a 1990s era tree like structure to rank well.</strong></p>
<p><a href="http://andybeard.eu/feed/">Subscribers</a> and <a href="http://technorati.com/faves?add=http://andybeard.eu">Technorati Favorites</a> may help you rank.</p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F543%252Fgoogle-blog-search.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22In%20Depth%3A%20Google%20BlogSearch%20%7C%20Ranking%20Blog%20Documents%20Patent%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/backlinks" title="backlinks" rel="tag">backlinks</a>, <a href="http://andybeard.eu/tag/blogging" title="blogging" rel="tag">blogging</a>, <a href="http://andybeard.eu/tag/bloglines" title="bloglines" rel="tag">bloglines</a>, <a href="http://andybeard.eu/tag/blogsearch" title="blogsearch" rel="tag">blogsearch</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/feedburner" title="feedburner" rel="tag">feedburner</a>, <a href="http://andybeard.eu/tag/google" title="Google" rel="tag">Google</a>, <a href="http://andybeard.eu/tag/google-blog-search" title="Google Blog Search" rel="tag">Google Blog Search</a>, <a href="http://andybeard.eu/tag/google-blogsearch" title="google blogsearch" rel="tag">google blogsearch</a>, <a href="http://andybeard.eu/tag/linking-strategy" title="linking strategy" rel="tag">linking strategy</a>, <a href="http://andybeard.eu/tag/rss" title="rss" rel="tag">rss</a>, <a href="http://andybeard.eu/tag/rss-subscribers" title="RSS Subscribers" rel="tag">RSS Subscribers</a>, <a href="http://andybeard.eu/tag/search-engine-optimization" title="search engine optimization" rel="tag">search engine optimization</a>, <a href="http://andybeard.eu/tag/search-engines" title="search engines" rel="tag">search engines</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a>, <a href="http://andybeard.eu/tag/subscribers" title="subscribers" rel="tag">subscribers</a>, <a href="http://andybeard.eu/tag/tag" title="tag" rel="tag">tag</a>, <a href="http://andybeard.eu/tag/tagging" title="tagging" rel="tag">tagging</a>, <a href="http://andybeard.eu/tag/tags" title="tags" rel="tag">tags</a>, <a href="http://andybeard.eu/tag/technorati" title="technorati" rel="tag">technorati</a>, <a href="http://andybeard.eu/tag/technorati-favorites" title="Technorati Favorites" rel="tag">Technorati Favorites</a>, <a href="http://andybeard.eu/tag/ultimate-tag-warrior" title="ultimate tag warrior" rel="tag">ultimate tag warrior</a>, <a href="http://andybeard.eu/tag/utw" title="utw" rel="tag">utw</a><br />
]]></content:encoded>
			<wfw:commentRss>http://andybeard.eu/543/google-blog-search.html/feed</wfw:commentRss>
		<slash:comments>18</slash:comments>
		</item>
		<item>
		<title>Articles Are Seeds of Knowledge &#8211; A Biblical Look at Duplicate Content</title>
		<link>http://andybeard.eu/322/articles-are-seeds-of-knowledge-a-biblical-look-at-duplicate-content.html</link>
		<comments>http://andybeard.eu/322/articles-are-seeds-of-knowledge-a-biblical-look-at-duplicate-content.html#comments</comments>
		<pubDate>Sun, 28 Jan 2007 16:56:05 +0000</pubDate>
		<dc:creator>Andy Beard</dc:creator>
				<category><![CDATA[marketing]]></category>
		<category><![CDATA[Article Distribution]]></category>
		<category><![CDATA[article marketing]]></category>
		<category><![CDATA[Article Syndication]]></category>
		<category><![CDATA[bible]]></category>
		<category><![CDATA[duplicate content]]></category>
		<category><![CDATA[gideons]]></category>
		<category><![CDATA[top10]]></category>

		<guid isPermaLink="false">http://andybeard.eu/2007/01/articles-are-seeds-of-knowledge-a-biblical-look-at-duplicate-content.html</guid>
		<description><![CDATA[
<p>It is Sunday although I am not a very religious person, thus I was, horror of horrors, outside shovelling snow around. It was drifting, and if I hadn&#8217;t done anything with it, it might have blocked the driveway for my wife Monday morning.</p>
<p><a href="http://andybeard.eu/322/articles-are-seeds-of-knowledge-a-biblical-look-at-duplicate-content.html" class="more-link">Read more on Articles Are Seeds of Knowledge &#8211; A Biblical Look at Duplicate Content&#8230;</a></p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F322%252Farticles-are-seeds-of-knowledge-a-biblical-look-at-duplicate-content.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22Articles%20Are%20Seeds%20of%20Knowledge%20-%20A%20Biblical%20Look%20at%20Duplicate%20Content%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/article-distribution" title="Article Distribution" rel="tag">Article Distribution</a>, <a href="http://andybeard.eu/tag/article-marketing" title="article marketing" rel="tag">article marketing</a>, <a href="http://andybeard.eu/tag/article-syndication" title="Article Syndication" rel="tag">Article Syndication</a>, <a href="http://andybeard.eu/tag/bible" title="bible" rel="tag">bible</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/gideons" title="gideons" rel="tag">gideons</a>, <a href="http://andybeard.eu/tag/top10" title="top10" rel="tag">top10</a><br />
]]></description>
			<content:encoded><![CDATA[
<p>It is Sunday although I am not a very religious person, thus I was, horror of horrors, outside shovelling snow around. It was drifting, and if I hadn&#8217;t done anything with it, it might have blocked the driveway for my wife Monday morning.</p>
<p>Does your mind wander when you are doing a physical job that doesn&#8217;t require much other thought? Mine certainly does.</p>
<h3>Duplicate Content of Biblical Proportions</h3>
<p>I have been doing some research of &#8220;Top 10 Lists&#8221; for a new site. Whilst no list of the top 10 best selling books is exactly the same, there is one common feature. Every single top 10 list states that The Bible in all its variations has sold more than 6 billion copies.<br />
That is close to the current world population, estimated by the CIA to be 6,525,170,264 (July 2006 est.)<br />
Thus there are probably as many bibles in the world as people</p>
<p>That is an awful lot of duplicate content</p>
<h3>Gideons</h3>
<p><a href="http://www.gideons.org/">Gideons</a> is an interesting organisation, whose work is evangelism and distribution of the bible. You will see Gideons bibles in every hotel room, and I was given a Gideons bible whilst at school in addition to a larger bible I was issued for Religious Education lessons.  </p>
<p>With the help of the Gideons organisation, whenever you need a bible, there is one close at hand.</p>
<h3>Spread the Word</h3>
<p>This is a fundamental concept in all religion, not just Christian. It is not enough to have the knowledge and faith, you are also meant to pass it onto other people. Lots of the time the knowledge will fall on deaf ears. If the knowledge is out there, and easy to find even without specifically looking for it, such as in a hotel room drawer, it has a benefit.</p>
<h3>Worthwhile Duplicate Content</h3>
<p>I am sure many of those 6 billion bibles are in dusty attics, unused drawers, or buried at the back on shelves, long forgotten. Every now and then one copy gets rediscovered, unearthed or brought out of hiding.</p>
<h3>The Bible and Duplicate Content</h3>
<p>A church is not the only place you can find a copy of the bible. I am sure many religious people read more of the bible while in church than the cumulative total of all other places, but that doesn&#8217;t make it pointless to have multiple copies in your home, school, library and even hotel rooms. All those copies of the bible are seeds, and every now and then one of those seeds gets picked up and begins to germinate, wherever the seed is located.</p>
<h3>Your Articles and Duplicate Content</h3>
<p>I recently wrote a mammoth blog post on my philosophy with <a href="http://andybeard.eu/2007/01/article-marketing.html">article marketing</a>. Many marketing experts believe that article marketing no longer works, or you should be highly selective where you publish your content.</p>
<p>I mentioned a strategy, that as long as you link back to the original source for your content that people can follow, it makes sense to spread your article as widely as possible.<br />
I don&#8217;t discount special publishing deals that will bring your article to the forefront of thousands of people, but that opportunity is often reserved for established writers.</p>
<h3>Articles Are Seeds of Knowledge</h3>
<p>Spread your articles far and wide. Sometimes they will land in fertile soil, and germinate and grow almost immediately. Whilst I wouldn&#8217;t dare liken <a href="http://ezinearticles.com">EzineArticles</a> to a church, it certainly is very fertile ground for your seeds to grow.</p>
<p>Some of your articles will almost certainly end up landing on less fertile ground, or buried deep in a website long forgotten. It is a seed that hasn&#8217;t germinated yet, but one day it might be uncovered and grow into a tree bearing fruit.</p>
<p>Sometimes your article may end up on even more unsavoury territory, with a link to you not being provided, or even worse plagiarised. It will happen, such is the nature of people. If the purpose of your article was to help people more than market yourself, then it really doesn&#8217;t matter if occasionally the link to you is broken. A person reading your article is still going to look for further knowledge on the subject, and eventually find their way to respected sources of information, such as yourself, just as someone picking up a Gideon&#8217;s bible might eventually find their way to a church.</p>
<p><strong>If you don&#8217;t sow your seeds, they don&#8217;t have a chance to grow</strong></p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F322%252Farticles-are-seeds-of-knowledge-a-biblical-look-at-duplicate-content.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22Articles%20Are%20Seeds%20of%20Knowledge%20-%20A%20Biblical%20Look%20at%20Duplicate%20Content%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/article-distribution" title="Article Distribution" rel="tag">Article Distribution</a>, <a href="http://andybeard.eu/tag/article-marketing" title="article marketing" rel="tag">article marketing</a>, <a href="http://andybeard.eu/tag/article-syndication" title="Article Syndication" rel="tag">Article Syndication</a>, <a href="http://andybeard.eu/tag/bible" title="bible" rel="tag">bible</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/gideons" title="gideons" rel="tag">gideons</a>, <a href="http://andybeard.eu/tag/top10" title="top10" rel="tag">top10</a><br />
]]></content:encoded>
			<wfw:commentRss>http://andybeard.eu/322/articles-are-seeds-of-knowledge-a-biblical-look-at-duplicate-content.html/feed</wfw:commentRss>
		<slash:comments>12</slash:comments>
		</item>
		<item>
		<title>Toolbar Pagerank &#124; Ball Linking</title>
		<link>http://andybeard.eu/310/toolbar-pagerank-ball-linking.html</link>
		<comments>http://andybeard.eu/310/toolbar-pagerank-ball-linking.html#comments</comments>
		<pubDate>Thu, 25 Jan 2007 14:46:34 +0000</pubDate>
		<dc:creator>Andy Beard</dc:creator>
				<category><![CDATA[blogging tips]]></category>
		<category><![CDATA[Google]]></category>
		<category><![CDATA[mininet]]></category>
		<category><![CDATA[SEO Blog]]></category>
		<category><![CDATA[vre]]></category>
		<category><![CDATA[Blog Linking]]></category>
		<category><![CDATA[Blog Traffic]]></category>
		<category><![CDATA[Deep Linking]]></category>
		<category><![CDATA[defensible traffic]]></category>
		<category><![CDATA[duplicate content]]></category>
		<category><![CDATA[Dynamic Linking]]></category>
		<category><![CDATA[Google PageRank]]></category>
		<category><![CDATA[link popularity]]></category>
		<category><![CDATA[Link Strategy]]></category>
		<category><![CDATA[linking]]></category>
		<category><![CDATA[linking strategy]]></category>
		<category><![CDATA[matt cutts]]></category>
		<category><![CDATA[nofollow]]></category>
		<category><![CDATA[pagerank]]></category>
		<category><![CDATA[PageRank Update]]></category>
		<category><![CDATA[revenge of the mininet]]></category>
		<category><![CDATA[search engine glossary]]></category>
		<category><![CDATA[search engine optimisation]]></category>
		<category><![CDATA[search engine optimization]]></category>
		<category><![CDATA[seo blogs]]></category>
		<category><![CDATA[Site Navigation]]></category>

		<guid isPermaLink="false">http://andybeard.eu/2007/01/toolbar-pagerank-ball-linking.html</guid>
		<description><![CDATA[
<p>Google have finally updated their toolbar pagerank for this site, not just on the front page, but also a lot of the deeper pages. Not all of them &#8211; some of those devoid of pagerank should probably have some, others probably shouldn&#8217;t especially moved content that hasn&#8217;t been given enough love.</p>
<p><a href="http://andybeard.eu/310/toolbar-pagerank-ball-linking.html" class="more-link">Read more on Toolbar Pagerank &#124; Ball Linking&#8230;</a></p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F310%252Ftoolbar-pagerank-ball-linking.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22Toolbar%20Pagerank%20%7C%20Ball%20Linking%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/blog-linking" title="Blog Linking" rel="tag">Blog Linking</a>, <a href="http://andybeard.eu/tag/blog-traffic" title="Blog Traffic" rel="tag">Blog Traffic</a>, <a href="http://andybeard.eu/tag/blogging-tips" title="blogging tips" rel="tag">blogging tips</a>, <a href="http://andybeard.eu/tag/deep-linking" title="Deep Linking" rel="tag">Deep Linking</a>, <a href="http://andybeard.eu/tag/defensible-traffic" title="defensible traffic" rel="tag">defensible traffic</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/dynamic-linking" title="Dynamic Linking" rel="tag">Dynamic Linking</a>, <a href="http://andybeard.eu/tag/google-pagerank" title="Google PageRank" rel="tag">Google PageRank</a>, <a href="http://andybeard.eu/tag/link-popularity" title="link popularity" rel="tag">link popularity</a>, <a href="http://andybeard.eu/tag/link-strategy" title="Link Strategy" rel="tag">Link Strategy</a>, <a href="http://andybeard.eu/tag/linking" title="linking" rel="tag">linking</a>, <a href="http://andybeard.eu/tag/linking-strategy" title="linking strategy" rel="tag">linking strategy</a>, <a href="http://andybeard.eu/tag/matt-cutts" title="matt cutts" rel="tag">matt cutts</a>, <a href="http://andybeard.eu/tag/mininet" title="mininet" rel="tag">mininet</a>, <a href="http://andybeard.eu/tag/nofollow" title="nofollow" rel="tag">nofollow</a>, <a href="http://andybeard.eu/tag/pagerank" title="pagerank" rel="tag">pagerank</a>, <a href="http://andybeard.eu/tag/pagerank-update" title="PageRank Update" rel="tag">PageRank Update</a>, <a href="http://andybeard.eu/tag/revenge-of-the-mininet" title="revenge of the mininet" rel="tag">revenge of the mininet</a>, <a href="http://andybeard.eu/tag/search-engine-glossary" title="search engine glossary" rel="tag">search engine glossary</a>, <a href="http://andybeard.eu/tag/search-engine-optimisation" title="search engine optimisation" rel="tag">search engine optimisation</a>, <a href="http://andybeard.eu/tag/search-engine-optimization" title="search engine optimization" rel="tag">search engine optimization</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a>, <a href="http://andybeard.eu/tag/seo-blogs" title="seo blogs" rel="tag">seo blogs</a>, <a href="http://andybeard.eu/tag/site-navigation" title="Site Navigation" rel="tag">Site Navigation</a><br />
]]></description>
			<content:encoded><![CDATA[
<p>Google have finally updated their toolbar pagerank for this site, not just on the front page, but also a lot of the deeper pages. Not all of them &#8211; some of those devoid of pagerank should probably have some, others probably shouldn&#8217;t especially moved content that hasn&#8217;t been given enough love.</p>
<p>As I have discussed in the past, when discussing <a href="http://andybeard.eu/2006/10/revenge-of-the-mininet-3rd-party-content-blog-comments-no-follow.html">blog internal linking</a>, for this blog I am doing &#8220;massive ball linking&#8221;.</p>
<p><img src='http://cdn5.andybeard.name/wp-content/uploads/2007/01/ball-or-structured.png' alt='Ball Linking or Structured' /></p>
<p>Links come into the blog from various places and to specific content. By using tagging and related posts on each page (maybe a few too many now), whatever pagerank, trust and relevance that a page is given, get passed onto other relevant content.</p>
<p>It also gets passed onto people who leave comments or trackback. <strong>When you link to me from your blog posts, the juice flows back</strong> &#8211; sometimes more, sometimes less, but it is all relevant links &#8211; just what the web is all about.</p>
<p>I suppose you could look on this as a &#8220;organic garden&#8221; approach. Just let things grow wild, and only interfere if something needs drastic change.</p>
<p>I haven&#8217;t been overly worried about the multiple forms of duplicate content that are typical on a WordPress blog.</p>
<h3>Exactly Why I Don&#8217;t Worry About Duplicate Content</h3>
<p>First of all I discussed this a little not so long ago, in particular about <a href="http://andybeard.eu/2007/01/matt-cutts-pagerank-supplemental-results.html"><strong>duplicate content</strong> and <strong>supplemental results</strong></a>.</p>
<p>Matt Cutts isn&#8217;t worried about <strong>honest duplicate content</strong></p>
<h3>Proof &#8211; Matt Really isn&#8217;t worried</h3>
<p>First of all lets take at look at Matt&#8217;s robots.txt file</p>
<blockquote><p>User-agent: *<br />
Allow:
</p></blockquote>
<p>Then you can look at the metadata on all Matts duplicate content pages</p>
<p>Category archives &#8211; I am going to link to his <a href="http://www.mattcutts.com/blog/type/glossarydefinitions/">seo glossary</a>, I am sure it doesn&#8217;t get many links.<br />
<a href="http://www.mattcutts.com/blog/2006/10/">Date Archives</a><br />
Sequential pages &#8211; lets <a href="http://www.mattcutts.com/blog/page/3/">go back in time a few pages</a></p>
<pre class="brush: xml; title: ; notranslate">
&lt;meta http-equiv=&quot;Content-Type&quot; content=&quot;text/html; charset=UTF-8&quot; /&gt;
&lt;title&gt;Matt Cutts: Gadgets, Google, and SEO &amp;raquo; Movies/Videos&lt;/title&gt;
&lt;meta name=&quot;generator&quot; content=&quot;WordPress 2.0.7&quot; /&gt; &lt;!-- leave this for stats --&gt;
&lt;meta name=&quot;robots&quot; content=&quot;noodp&quot;&gt;
</pre>
<p>Basically he lets the search engines work out what is going on.</p>
<p>There are simple plugins out there to prevent these pages being indexed and followed in various ways, but Matt Cutts doesn&#8217;t worry about it.</p>
<p><a href="http://web.archive.org/web/20060328225949/www.mattcutts.com/blog/">The Wayback Machine</a></p>
<p>Yep, more duplicate content &#8211; Matt doesn&#8217;t block them</p>
<p>Matt Doesn&#8217;t even block the <a href="http://www.mattcutts.com/blog/wp-login.php">login page</a> to his WordPress installation &#8211; that same page appears over 2 million times on the web.</p>
<h3>Let it Flow</h3>
<p>OMG I am wasting all that Google Juice that I worked so hard for!</p>
<p>Or maybe not&#8230;</p>
<p>Google Juice is liquid&#8230; it flows, it you give it a direction to flow in.</p>
<p>Whilst you may give a page with duplicate content some juice, that juice flows back out to other pages. Just because that page might end up in the supplemental results, doesn&#8217;t mean the Google juice is being wasted.</p>
<p>Some blog designs unfortunately place too much emphasis on the most current content. They don&#8217;t use tags, their date archives are accessed by a silly calendar widget on the front page, and they don&#8217;t have any other routes for pagerank to flow. </p>
<h3>Structured Linking</h3>
<p>It is possible to use only a very structured linking system for a blog, but it is important to think about relevance. In Revenge of the Mininet there are some great linking structures defined. They would be ideal for highly &#8220;niched&#8221; sites.</p>
<p>Many blogs, including this one, cover a wide multitude of subjects. A carefully constructed linking structure would be much harder to define and you might lose the benefit of giving relevance to specific pages.</p>
<h3>Structured Relevance?</h3>
<p>Some duplicate content pages give great, maybe even enhanced relevance to content.<br />
Date archives in many blog designs are not very helpful. If date archives and previous pages are used as the primary navigation to previous content, and path for search engines to take, you really aren&#8217;t giving your content any justice or longevity.</p>
<h3>Content Longevity</h3>
<p>Lets look at some of my internal pages for longevity</p>
<p><a href="http://andybeard.eu/2006/11/how-a-blogroll-can-kill-your-pagerank.html">How a Blogroll can kill your Pagerank</a> &#8211; 2 month old post, linked to a few times in posts, but it appears a lot on pages due to tagging and using related posts &#8211; <strong>currently PR4</strong></p>
<p><a href="http://andybeard.eu/2006/12/nofollow-and-pink-boxes.html">NoFollow and Pink Boxes</a> &#8211; <strong>also PR4</strong></p>
<p>Some posts on UTW Tips &#8211; <strong>both PR3</strong></p>
<p><a href="http://andybeard.eu/2006/11/ultimate-tag-warrior-seo-tricks-pt-1.html">Ultimate Tag Warrior SEO Tricks (pt 1)</a><br />
<a href="http://andybeard.eu/2006/11/utw-tagging-seo-tricks-pt-2.html">UTW &#8211; Tagging SEO Tricks (pt 2)</a></p>
<p>From browsing around, I have discovered that the Google Toolbar Pagerank isn&#8217;t completely comprehensive, as I have posts that should have PR4 that don&#8217;t. One of them was my highest ranking page in November and December.</p>
<p>It was hard to find a post that hadn&#8217;t been later referred to in a more recent post but this is a good example:-</p>
<p><a href="http://andybeard.eu/2006/11/no-nofollow-no-nofollowcom.html">No NoFollow &#038; No-Nofollow.com</a></p>
<p>That post is again PR3, and didn&#8217;t receive any specific direct love from outside links or internal links in posts. It did benefit from tagging, and related posts.</p>
<p>This time around I didn&#8217;t tag and categorize my old content from my blogspot domain. Almost all of that content didn&#8217;t receive much pagerank love unless it had been linked to directly.<br />
I am going to see if for the next update it can be revitalized.</p>
<p><strong>How much of your old content retains visible pagerank?</strong></p>
<p>It is actually still difficult to compare, because so many pages still haven&#8217;t received pagerank they probably deserve. Even Matt has some pages that are linked to from PR6 categories that show a toolbar pagerank of zero such as http://www.mattcutts.com/blog/starving-to-death-review/</p>
<p>I would link to it directly with a live link, but I don&#8217;t want to ruin the example</p>
<p>For one of Matts posts that one probably received <a href="http://search.yahoo.com/search?p=link%3Ahttp%3A//www.mattcutts.com/blog/starving-to-death-review/+-site%3Amattcutts.com">a lot less inbound links</a></p>
<p>Yes that is a Yahoo link &#8211; wouldn&#8217;t it be nice to have a &#8220;-all&#8221; flag on Google searches to list everything below Google&#8217;s threshold as well, even if it is just an aid for webmasters to find splogs. </p>
<h3>Conclusion</h3>
<p>Matt is a busy man, maybe he hasn&#8217;t had time to optimize and avoid all these duplicate content issues but I really believe it is nothing to worry about, and Matt might just be demonstrating this  with his own blog.</p>
<p>You can aim for a more focused structure on a blog, using various forms of dynamic linking but it is not something easy to achieve yet with any platform.</p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F310%252Ftoolbar-pagerank-ball-linking.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22Toolbar%20Pagerank%20%7C%20Ball%20Linking%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/blog-linking" title="Blog Linking" rel="tag">Blog Linking</a>, <a href="http://andybeard.eu/tag/blog-traffic" title="Blog Traffic" rel="tag">Blog Traffic</a>, <a href="http://andybeard.eu/tag/blogging-tips" title="blogging tips" rel="tag">blogging tips</a>, <a href="http://andybeard.eu/tag/deep-linking" title="Deep Linking" rel="tag">Deep Linking</a>, <a href="http://andybeard.eu/tag/defensible-traffic" title="defensible traffic" rel="tag">defensible traffic</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/dynamic-linking" title="Dynamic Linking" rel="tag">Dynamic Linking</a>, <a href="http://andybeard.eu/tag/google-pagerank" title="Google PageRank" rel="tag">Google PageRank</a>, <a href="http://andybeard.eu/tag/link-popularity" title="link popularity" rel="tag">link popularity</a>, <a href="http://andybeard.eu/tag/link-strategy" title="Link Strategy" rel="tag">Link Strategy</a>, <a href="http://andybeard.eu/tag/linking" title="linking" rel="tag">linking</a>, <a href="http://andybeard.eu/tag/linking-strategy" title="linking strategy" rel="tag">linking strategy</a>, <a href="http://andybeard.eu/tag/matt-cutts" title="matt cutts" rel="tag">matt cutts</a>, <a href="http://andybeard.eu/tag/mininet" title="mininet" rel="tag">mininet</a>, <a href="http://andybeard.eu/tag/nofollow" title="nofollow" rel="tag">nofollow</a>, <a href="http://andybeard.eu/tag/pagerank" title="pagerank" rel="tag">pagerank</a>, <a href="http://andybeard.eu/tag/pagerank-update" title="PageRank Update" rel="tag">PageRank Update</a>, <a href="http://andybeard.eu/tag/revenge-of-the-mininet" title="revenge of the mininet" rel="tag">revenge of the mininet</a>, <a href="http://andybeard.eu/tag/search-engine-glossary" title="search engine glossary" rel="tag">search engine glossary</a>, <a href="http://andybeard.eu/tag/search-engine-optimisation" title="search engine optimisation" rel="tag">search engine optimisation</a>, <a href="http://andybeard.eu/tag/search-engine-optimization" title="search engine optimization" rel="tag">search engine optimization</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a>, <a href="http://andybeard.eu/tag/seo-blogs" title="seo blogs" rel="tag">seo blogs</a>, <a href="http://andybeard.eu/tag/site-navigation" title="Site Navigation" rel="tag">Site Navigation</a><br />
]]></content:encoded>
			<wfw:commentRss>http://andybeard.eu/310/toolbar-pagerank-ball-linking.html/feed</wfw:commentRss>
		<slash:comments>4</slash:comments>
		</item>
		<item>
		<title>Duplicate Content</title>
		<link>http://andybeard.eu/160/duplicate-content.html</link>
		<comments>http://andybeard.eu/160/duplicate-content.html#comments</comments>
		<pubDate>Thu, 07 Dec 2006 07:38:01 +0000</pubDate>
		<dc:creator>Andy Beard</dc:creator>
				<category><![CDATA[SEO Blog]]></category>
		<category><![CDATA[duplicate content]]></category>
		<category><![CDATA[search engine optimization]]></category>

		<guid isPermaLink="false">http://andybeard.eu/2006/12/duplicate-content.html</guid>
		<description><![CDATA[
<p>Lee Odden has a great overview on duplicate content issues.</p>
<p>He is blogging various sessions from the Chicago Search Engine Strategies conference.</p>
<p>Here are the bullet points from just one of the speakers on the session (Shari Thurow), and I bolded one of them</p>
<p><a href="http://andybeard.eu/160/duplicate-content.html" class="more-link">Read more on Duplicate Content&#8230;</a></p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F160%252Fduplicate-content.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22Duplicate%20Content%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/search-engine-optimization" title="search engine optimization" rel="tag">search engine optimization</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a><br />
]]></description>
			<content:encoded><![CDATA[
<p>Lee Odden has a great overview on duplicate content issues.</p>
<p>He is blogging various sessions from the Chicago Search Engine Strategies conference.</p>
<p>Here are the bullet points from just one of the speakers on the session (Shari Thurow), and I bolded one of them</p>
<blockquote><p>Ways that search engines filter out redundant content:</p>
<p>    * Content properties &#8211; removes boilerplate elements and reviews whatâ€™s left<br />
    * <strong>Linkage properties &#8211; Is a press release on the wire service and the press release on a web site duplicate content? No, because the linkage properties are distinctly different, even though the content is the same</strong><br />
    * Content evolution &#8211; most content does not change. High average page mutation &#8211; news site. Low would be a manufacturing site<br />
    * Host name resolution &#8211; If the hostname resolves to the same domain name, one version of the redundant content will be selected as the canonical url<br />
    * Shingle comparison &#8211; References Andrei Broder. Shingles are word sets. The more shingles that a document has, the more likely it is duplicate content.
</p></blockquote>
<p>There is very little difference between article marketing and press releases.</p>
<p>The big difference is in the other navigation elements on the page.</p>
<p>If you are using one of the very popular article site scripts, work hard in differentiating your site from other sites using the same script, especially if you are receiving the articles from a similar source such as Article Marketer.</p>
<p>The same would be true of people using RSS feeds from Article directories. If you are not doing anything to change the linking structures of a page and relationships between content, you are not going to achieve the results you want.</p>
<p>Do take the trouble to pop over to Lee&#8217;s blog and read the full article:- <a href="http://www.toprankblog.com/2006/12/duplicate-content-and-multiple-site-issues/">Duplicate Content and Multiple Site Issues</a></p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F160%252Fduplicate-content.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22Duplicate%20Content%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/search-engine-optimization" title="search engine optimization" rel="tag">search engine optimization</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a><br />
]]></content:encoded>
			<wfw:commentRss>http://andybeard.eu/160/duplicate-content.html/feed</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>International Article Syndication</title>
		<link>http://andybeard.eu/143/international-article-syndication.html</link>
		<comments>http://andybeard.eu/143/international-article-syndication.html#comments</comments>
		<pubDate>Sat, 25 Nov 2006 11:41:26 +0000</pubDate>
		<dc:creator>Andy Beard</dc:creator>
				<category><![CDATA[Google]]></category>
		<category><![CDATA[marketing]]></category>
		<category><![CDATA[article marketing]]></category>
		<category><![CDATA[Article Submission]]></category>
		<category><![CDATA[Article Syndication]]></category>
		<category><![CDATA[duplicate content]]></category>
		<category><![CDATA[google alert]]></category>
		<category><![CDATA[google translate]]></category>
		<category><![CDATA[machine translation]]></category>
		<category><![CDATA[search engine optimization]]></category>
		<category><![CDATA[SEO Blog]]></category>
		<category><![CDATA[site monitoring]]></category>
		<category><![CDATA[translation]]></category>

		<guid isPermaLink="false">http://andybeard.eu/2006/11/international-article-syndication.html</guid>
		<description><![CDATA[
<p>I use Google Alerts to track a lot of my article syndication, and sometimes it comes up with some absolute diamonds of ways content can be presented to an international audience.</p>
<p><a href="http://andybeard.eu/143/international-article-syndication.html" class="more-link">Read more on International Article Syndication&#8230;</a></p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F143%252Finternational-article-syndication.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22International%20Article%20Syndication%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/article-marketing" title="article marketing" rel="tag">article marketing</a>, <a href="http://andybeard.eu/tag/article-submission" title="Article Submission" rel="tag">Article Submission</a>, <a href="http://andybeard.eu/tag/article-syndication" title="Article Syndication" rel="tag">Article Syndication</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/google" title="Google" rel="tag">Google</a>, <a href="http://andybeard.eu/tag/google-alert" title="google alert" rel="tag">google alert</a>, <a href="http://andybeard.eu/tag/google-translate" title="google translate" rel="tag">google translate</a>, <a href="http://andybeard.eu/tag/machine-translation" title="machine translation" rel="tag">machine translation</a>, <a href="http://andybeard.eu/tag/search-engine-optimization" title="search engine optimization" rel="tag">search engine optimization</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a>, <a href="http://andybeard.eu/tag/site-monitoring" title="site monitoring" rel="tag">site monitoring</a>, <a href="http://andybeard.eu/tag/translation" title="translation" rel="tag">translation</a><br />
]]></description>
			<content:encoded><![CDATA[
<p>I use Google Alerts to track a lot of my article syndication, and sometimes it comes up with some absolute diamonds of ways content can be presented to an international audience.</p>
<p>My original article was <a href="http://andybeard.eu/2005/07/keywords-ranking-and-a-little-seo-fun.html">Keywords, ranking and a little SEO fun</a>. It is over 16 months old but still spreading.</p>
<p><a href="http://www.vaitman.com/tr/cn/?q=/seo/55469.php">Take a look at this website in Chineese</a> (I am not sure which Chineese)</p>
<p>First impression, you can&#8217;t understand a word of it&#8230; correct?</p>
<p>Try moving your mouse over the article content &#8211; up pops the original English phrase.</p>
<p>I am not sure exactly how they are doing this, and technically translation can be looked on as an unauthorised modification of the original work, but honestly I don&#8217;t care.</p>
<p>The way they have done this is extremely smart, especially if they have used some form of machine translation. For any phrase that wasn&#8217;t translated correcty, there is an immediate reference to the original document.<br />
In addition Google are picking up the live backlinks surrounded by English text.</p>
<p>This is a feature that translation services such as Google Translate need to make their translation more useful.</p>
<p>It is one of the most innovative uses I have ever seen for duplicate 3rd party content.</p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F143%252Finternational-article-syndication.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22International%20Article%20Syndication%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/article-marketing" title="article marketing" rel="tag">article marketing</a>, <a href="http://andybeard.eu/tag/article-submission" title="Article Submission" rel="tag">Article Submission</a>, <a href="http://andybeard.eu/tag/article-syndication" title="Article Syndication" rel="tag">Article Syndication</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/google" title="Google" rel="tag">Google</a>, <a href="http://andybeard.eu/tag/google-alert" title="google alert" rel="tag">google alert</a>, <a href="http://andybeard.eu/tag/google-translate" title="google translate" rel="tag">google translate</a>, <a href="http://andybeard.eu/tag/machine-translation" title="machine translation" rel="tag">machine translation</a>, <a href="http://andybeard.eu/tag/search-engine-optimization" title="search engine optimization" rel="tag">search engine optimization</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a>, <a href="http://andybeard.eu/tag/site-monitoring" title="site monitoring" rel="tag">site monitoring</a>, <a href="http://andybeard.eu/tag/translation" title="translation" rel="tag">translation</a><br />
]]></content:encoded>
			<wfw:commentRss>http://andybeard.eu/143/international-article-syndication.html/feed</wfw:commentRss>
		<slash:comments>4</slash:comments>
		</item>
		<item>
		<title>UTW &#8211; Tagging SEO Tricks (pt 2)</title>
		<link>http://andybeard.eu/140/utw-tagging-seo-tricks-pt-2.html</link>
		<comments>http://andybeard.eu/140/utw-tagging-seo-tricks-pt-2.html#comments</comments>
		<pubDate>Sat, 25 Nov 2006 09:19:27 +0000</pubDate>
		<dc:creator>Andy Beard</dc:creator>
				<category><![CDATA[Google]]></category>
		<category><![CDATA[plugins]]></category>
		<category><![CDATA[SEO Blog]]></category>
		<category><![CDATA[backlinks]]></category>
		<category><![CDATA[Blog Navigation]]></category>
		<category><![CDATA[blogging tips]]></category>
		<category><![CDATA[duplicate content]]></category>
		<category><![CDATA[folksonomy]]></category>
		<category><![CDATA[Google Results]]></category>
		<category><![CDATA[linking strategy]]></category>
		<category><![CDATA[msn]]></category>
		<category><![CDATA[relevant content]]></category>
		<category><![CDATA[search engines]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[tags]]></category>
		<category><![CDATA[ultimate tag warrior]]></category>
		<category><![CDATA[utw]]></category>
		<category><![CDATA[white hat]]></category>
		<category><![CDATA[wordpress]]></category>
		<category><![CDATA[wordpress plugins]]></category>
		<category><![CDATA[yahoo]]></category>

		<guid isPermaLink="false">http://andybeard.eu/2006/11/utw-tagging-seo-tricks-pt-2.html</guid>
		<description><![CDATA[
<p>This is not a technical trick, but something that many people who confuse categories and tagging really need to get a grasp of.<br />
It is also my belief that this is very much a white-hat strategy, but as with all forms of search engine marketing, it can be abused.</p>
<p><a href="http://andybeard.eu/140/utw-tagging-seo-tricks-pt-2.html" class="more-link">Read more on UTW &#8211; Tagging SEO Tricks (pt 2)&#8230;</a></p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F140%252Futw-tagging-seo-tricks-pt-2.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22UTW%20-%20Tagging%20SEO%20Tricks%20%28pt%202%29%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/backlinks" title="backlinks" rel="tag">backlinks</a>, <a href="http://andybeard.eu/tag/blog-navigation" title="Blog Navigation" rel="tag">Blog Navigation</a>, <a href="http://andybeard.eu/tag/blogging-tips" title="blogging tips" rel="tag">blogging tips</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/folksonomy" title="folksonomy" rel="tag">folksonomy</a>, <a href="http://andybeard.eu/tag/google" title="Google" rel="tag">Google</a>, <a href="http://andybeard.eu/tag/google-results" title="Google Results" rel="tag">Google Results</a>, <a href="http://andybeard.eu/tag/linking-strategy" title="linking strategy" rel="tag">linking strategy</a>, <a href="http://andybeard.eu/tag/msn" title="msn" rel="tag">msn</a>, <a href="http://andybeard.eu/tag/relevant-content" title="relevant content" rel="tag">relevant content</a>, <a href="http://andybeard.eu/tag/search-engines" title="search engines" rel="tag">search engines</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a>, <a href="http://andybeard.eu/tag/tagging" title="tagging" rel="tag">tagging</a>, <a href="http://andybeard.eu/tag/tags" title="tags" rel="tag">tags</a>, <a href="http://andybeard.eu/tag/ultimate-tag-warrior" title="ultimate tag warrior" rel="tag">ultimate tag warrior</a>, <a href="http://andybeard.eu/tag/utw" title="utw" rel="tag">utw</a>, <a href="http://andybeard.eu/tag/white-hat" title="white hat" rel="tag">white hat</a>, <a href="http://andybeard.eu/tag/wordpress" title="wordpress" rel="tag">wordpress</a>, <a href="http://andybeard.eu/tag/wordpress-plugins" title="wordpress plugins" rel="tag">wordpress plugins</a>, <a href="http://andybeard.eu/tag/yahoo" title="yahoo" rel="tag">yahoo</a><br />
]]></description>
			<content:encoded><![CDATA[
<p>This is not a technical trick, but something that many people who confuse categories and tagging really need to get a grasp of.<br />
It is also my belief that this is very much a white-hat strategy, but as with all forms of search engine marketing, it can be abused.</p>
<p>Categories are for storing your documents into nice managable chucks on related topics.</p>
<p>Tagging can and should go far beyond categories in relating content to specific keywords.</p>
<p><strong>Here is a good example:-</strong></p>
<p>WordPress Training<br />
Wordpress Tutorials<br />
Wordpress Tuition</p>
<p>I would suggest you wouldn&#8217;t want to have all 3 phrases as a category in your sidebar. You could however be quite justified in tagging a related article with all 3 phrases, if they were appropriate.</p>
<p><strong>There are several reasons for this:-</strong></p>
<p><large>1.</large> Tag searches do not use LSI. They do however quite often display related tags. The more data you provide related to your article, the more accurately it can be classified, and later found. In many ways your tags should be very tightly related LSI keywords.</p>
<p>2. MYSQL Search &#8211; lets face it, it isn&#8217;t highly effective. If someone is searching your site, the chances of them finding what they are looking for are remote unless you provide a lot of keywords on a page.</p>
<p>3. Folksonomy provides a better way to search when you use tag clouds to provide visual suggestions for what a reader may be looking for. In my example above, &#8220;training&#8221;, &#8220;tuition&#8221; and &#8220;tutorials&#8221; actually provide different stimulai</p>
<p>4. Better references to related content</p>
<p>Lets say you have a niche blog on dogs.</p>
<p>You might have categories on dog training, dog health, dog accessories etc</p>
<p>You might use tags to interrelate articles on dog training at feeding time, dog food, and dog bowl.</p>
<p>5. Making your website wider &#8211; making a better mouse-trap</p>
<p>Does Google really give penalties for duplicate content, or duplicate content that doesn&#8217;t have a specific purpose?</p>
<p>It is my belief that Google doesn&#8217;t give duplicate content penalties for content that has a specific purpose, that they can easily identify.</p>
<p>Technorati is all duplicate content, but it has a purpose, helping people find what they are looking for. I noted recently that <a href="http://andybeard.eu/2006/11/wordpresscom-linking-structure.html" rel="tag">tag pages</a> at WordPress.com which are also full of duplicate content, give great backlinks for the blogs hosted there.</p>
<h2>Google Likes Tag Pages</h2>
<p>I think Google in some way within their algorithms are allowing duplicate content if it is on a page that is clearly a tag page, whether on an authority site, or on individual websites.</p>
<p>It is easy for people to spot such a page, they normally use tag or tags in the URL. If they wanted to algorithmically wipe out all that duplicate content they could with a wave of their hand.</p>
<p>But they haven&#8217;t&#8230; in fact pages that Google identifies as a tag page, it might be argued, are sometimes given a boost in search engine results.</p>
<h2>I am sure you want some proof</h2>
<p>I can&#8217;t give you total proof. </p>
<p>This is based upon my observations on multiple domains I own or monitor closely. I am not going to openly reveal all my niche sites (people try all kinds of ways to search for them every day, and they find old sites that have been allowed to be found).</p>
<p>I will give you one example though, which I noticed today.</p>
<p>This example is based upon the following:-</p>
<p>This is quite a new domain, but I do have an existing domain andybeard.name redirecting here with a global 301. I also have an existing blog on blogspot redirecting here with a meta refresh.<br />
I have a few &#8220;exposed&#8221; niche sites linking back to this site.</p>
<p>That being said, Google doesn&#8217;t seem to be showing any backlinks (there are quite a few of them), though other search engines are.<br />
It has been reported recently that Google are giving enhanced results to blog search within their main listings, especially in Europe which is a frequent test location. This isn&#8217;t related, <a href="http://www.boydcreative.net/google/google-integrating-blog-posts-into-search-results/">because those results were appearing at the bottom of the Google listings</a>.</p>
<p>I am located in Poland, and my IP address is Polish. Someone located in the US might see something different, using the same search URLs.</p>
<p>Here is a screenshot of a search result I noticed today. This one is on Google.com, but I have also tried Google.co.uk, Google.at, Google.pl, Google.de and a few more.<br />
The results were similar. On the foreign language sites I generally held the position for the first English language result.</p>
<p><center><br />
<a href="http://cdn5.andybeard.name/wp-content/uploads/2006/11/Wordpress-Training.jpg"><img src="http://cdn5.andybeard.name/wp-content/uploads/2006/11/Wordpress-Training.jpg" alt="Google Search for WordPress Training" width="400"></a><br />
<a href="http://cdn5.andybeard.name/wp-content/uploads/2006/11/Wordpress-Training.jpg">Google Search for WordPress Training</a></center></p>
<p>It isn&#8217;t a highly competitive keyword, and the results for &#8220;WordPress Tutorials&#8221; which is more competitive are different. </p>
<p>Now I do have to admit the tag page that is gaining the result is fairly junky looking. It is a result of the way my content is laid out, and I do need to get it fixed.<br />
I include tags at the start of my content, and those tags appear at the start of any excerpt. This is true for excerpts, whether created by WordPress or by Ultimate Tag Warrior.<br />
As standard there isn&#8217;t an easy way to adjust excerpt length unless you create a custom excerpt for every post.</p>
<p>In my defense it is not deliberate keyword spamming, it is something I am aware of, and it will be fixed. I am not a programmer, I just tinker with PHP, and the tag pages and archive pages on this blog are currently &#8220;out-of-the-box&#8221; configurations.</p>
<h2>Specific to Google</h2>
<p>This weighting of tag pages seems to be specific to Google.</p>
<p>For instance for the same search on MSN my original content is ranked around 26th position, but they still have lots of tag pages showing, and it is obvious the search is not very LSI based, as lots of dog and horse training pages appear.<br />
Yahoo has fairly similar results to MSN, I have a result in 23rd place, but it is a totally different page.</p>
<h2>Folksonomy and LSI</h2>
<p>Folksonomy is in many ways the same as LSI. </p>
<p>With folksonomy the relationship between keywords is created by humans.<br />
LSI is meant to be based upon algorithms, but is a lot more complicated. It is however based on words, and it is much easier to start with a list of human word relationships and to then apply additional relationships.</p>
<p>It is my belief that Google is in some way using folksonomy as part of its LSI calculations. It is even possible that they have recently increased the relevance of that part of their calculation.</p>
<h2>Going Forward</h2>
<p>Tagging is important for folksonomy based search. Tag pages on your own domain seem to be gaining a lot of relevance in Google.</p>
<p>Over the coming weeks I am going to be working to improve the quality of my tag pages, so that they provide unique content, and enhanced value for my readers.</p>
<p>Using tags for all keyword links might add enhanced relevance.<br />
If you were buying textlinks, paid posts etc, would the value of the textlinks be enhanced if they had rel=&#8221;tag&#8221; ?</p>
<p>I have heard bloggers argue that creating links with relevant keywords is keyword spamming. In my opinion it is actually &#8220;best practice&#8221; if you are linking to someone to use a relevant keyword to the content you are linking to. It isn&#8217;t Google bombing, it is helping the search engines relate different content. If you then include rel=&#8221;tag&#8221; in the link, you are also helping folksonomy search.</p>
<p>You should maybe think carefully about your tagging strategy for 2007</p>
<div class="topsy_widget_data topsy_theme_brick-red" style="float: right;margin-left: 0.75em; background: url(data:,%7B%20%22url%22%3A%20%22http%253A%252F%252Fandybeard.eu%252F140%252Futw-tagging-seo-tricks-pt-2.html%22%2C%20%22style%22%3A%20%22small%22%2C%20%22title%22%3A%20%22UTW%20-%20Tagging%20SEO%20Tricks%20%28pt%202%29%22%20%7D);"></div>


	Tags: <a href="http://andybeard.eu/tag/backlinks" title="backlinks" rel="tag">backlinks</a>, <a href="http://andybeard.eu/tag/blog-navigation" title="Blog Navigation" rel="tag">Blog Navigation</a>, <a href="http://andybeard.eu/tag/blogging-tips" title="blogging tips" rel="tag">blogging tips</a>, <a href="http://andybeard.eu/tag/duplicate-content" title="duplicate content" rel="tag">duplicate content</a>, <a href="http://andybeard.eu/tag/folksonomy" title="folksonomy" rel="tag">folksonomy</a>, <a href="http://andybeard.eu/tag/google" title="Google" rel="tag">Google</a>, <a href="http://andybeard.eu/tag/google-results" title="Google Results" rel="tag">Google Results</a>, <a href="http://andybeard.eu/tag/linking-strategy" title="linking strategy" rel="tag">linking strategy</a>, <a href="http://andybeard.eu/tag/msn" title="msn" rel="tag">msn</a>, <a href="http://andybeard.eu/tag/relevant-content" title="relevant content" rel="tag">relevant content</a>, <a href="http://andybeard.eu/tag/search-engines" title="search engines" rel="tag">search engines</a>, <a href="http://andybeard.eu/tag/seo" title="SEO Blog" rel="tag">SEO Blog</a>, <a href="http://andybeard.eu/tag/tagging" title="tagging" rel="tag">tagging</a>, <a href="http://andybeard.eu/tag/tags" title="tags" rel="tag">tags</a>, <a href="http://andybeard.eu/tag/ultimate-tag-warrior" title="ultimate tag warrior" rel="tag">ultimate tag warrior</a>, <a href="http://andybeard.eu/tag/utw" title="utw" rel="tag">utw</a>, <a href="http://andybeard.eu/tag/white-hat" title="white hat" rel="tag">white hat</a>, <a href="http://andybeard.eu/tag/wordpress" title="wordpress" rel="tag">wordpress</a>, <a href="http://andybeard.eu/tag/wordpress-plugins" title="wordpress plugins" rel="tag">wordpress plugins</a>, <a href="http://andybeard.eu/tag/yahoo" title="yahoo" rel="tag">yahoo</a><br />
]]></content:encoded>
			<wfw:commentRss>http://andybeard.eu/140/utw-tagging-seo-tricks-pt-2.html/feed</wfw:commentRss>
		<slash:comments>14</slash:comments>
		</item>
	</channel>
</rss>

<!-- Performance optimized by W3 Total Cache. Learn more: http://www.w3-edge.com/wordpress-plugins/

Page Caching using disk: basic
Database Caching 47/125 queries in 0.030 seconds using disk: basic
Object Caching 4826/5037 objects using disk: basic
Content Delivery Network via cdn5.andybeard.name

Served from: andybeard.eu @ 2012-02-13 07:06:49 -->
