Today, the customer asked me for create a dynamic sitemap.xml file on the sitecore project. I tried to use some existing packages from the Marketplace, but they didn't work for this project. We were needing a very simple version. So... why not create a new one from the scratch? This is not a big deal.
We have 2 different approaches to do this:
Approach 1: We can create the sitemap.xml file and we can put it on the root of the folder.
- Pros: Once the file is created as a static file, the indexers could take it without an extra processing of our system.
- Cons: We have to ensure that the sitemap.xml URLs are in sync with the published items. It's because the indexer could penalize this error. Maybe we can create this file when the author publishes the items to Web database. This could resolve this issue.
Approach 2: We can create the sitemap.xml content dynamically and we can show it through a handlers.
- Pros: We are recreating the file content when the indexer is trying the take it. This could ensure an accurate content all the time without penalizations.
- Cons: The system is going to process this content each time the indexer try to take it. This could take resources from our server, but we can cache this content to resolve this issue.
I want to do something super simple. I love the simple ideas, because most of the time they are more flexible on different context. So, let's take the second approach.
We can build this handler easily, adding a new pipeline on the HttpRequestBegin. Let's remember that Sitecore address the handlers in a special way (link)
Here is the code: https://github.com/SitecoreFromArg/SimpleSitemapXml. Feel free to use it and modify it. Any contribution is welcome. Also, you have the package on the marketplace here.
If you want to change the configuration of this code to handle a sitemap with XML extension, you will need to:
- Change the configuration file of this code in the "sitemapUrl" parameter to "/sitemap.ashx"
- Change the robots.txt file to indicate the new extension of the sitemap.
- Change the IIS settings to avoid handle this file as an static file.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
User-agent: * | |
Disallow: /sitecore/ | |
Sitemap: /sitemap.ashx |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
<configuration xmlns:patch="http://www.sitecore.net/xmlconfig/"> | |
<sitecore> | |
<pipelines> | |
<httpRequestBegin> | |
<processor type="SitecoreFromArg.SimpleSitemapXml.SitemapXmlGenerator,SitecoreFromArg.SimpleSitemapXml" | |
patch:before="processor[@type='Sitecore.Pipelines.HttpRequest.CustomHandlers, Sitecore.Kernel']"> | |
<!-- | |
sitemapUrl: | |
Place in the URL where you want to put the sitemap.xml | |
cacheTime: | |
Cache time in seconds. | |
excludedPaths: | |
Collection of item paths that you want to exclude of the sitemap.xml. | |
The pipeline will exclude all items with this string as part of the path. | |
You can add more that one, separating them with a pipe | |
--> | |
<sitemapUrl>/sitemap.ashx</sitemapUrl> | |
<cacheTime>1</cacheTime> | |
<excludedPaths>/My Account/|/Customer/</excludedPaths> | |
</processor> | |
</httpRequestBegin> | |
</pipelines> | |
</sitecore> | |
</configuration> |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
using System; | |
using System.Linq; | |
using Sitecore.Pipelines.HttpRequest; | |
using Sitecore.Diagnostics; | |
using Sitecore; | |
using Sitecore.Links; | |
using System.Xml; | |
using Sitecore.Data.Items; | |
using Sitecore.Data.Fields; | |
using Sitecore.Layouts; | |
using System.Web.Caching; | |
namespace SitecoreFromArg.SimpleSitemapXml | |
{ | |
public class SitemapXmlGenerator : HttpRequestProcessor | |
{ | |
public string sitemapUrl { get; set; } | |
public string excludedPaths { get; set; } | |
public string cacheTime { get; set; } | |
public override void Process(HttpRequestArgs args) | |
{ | |
Assert.ArgumentNotNull((object)args, "args"); | |
if (Context.Site == null || string.IsNullOrEmpty(Context.Site.RootPath.Trim())) return; | |
if (Context.Page.FilePath.Length > 0) return; | |
if (!args.Url.FilePath.Contains(sitemapUrl)) return; | |
// Important to return qualified XML (text/xml) for sitemaps | |
args.Context.Response.ClearHeaders(); | |
args.Context.Response.ClearContent(); | |
args.Context.Response.ContentType = "text/xml"; | |
// Checking the cache first | |
var sitemapXmlCache = args.Context.Cache["sitemapxml"]; | |
if (sitemapXmlCache != null) | |
{ | |
args.Context.Response.Write(sitemapXmlCache.ToString()); | |
args.Context.Response.End(); | |
return; | |
} | |
// | |
var options = LinkManager.GetDefaultUrlOptions(); | |
options.AlwaysIncludeServerUrl = true; | |
// Creating the XML Header | |
var xml = new XmlTextWriter(args.Context.Response.Output); | |
xml.WriteStartDocument(); | |
xml.WriteStartElement("urlset", "http://www.sitemaps.org/schemas/sitemap/0.9"); | |
// Creating the XML Body | |
try | |
{ | |
var items = Context.Database.SelectItems("fast:" + Context.Site.RootPath + "//*"); | |
foreach (var item in items) | |
{ | |
if (IsPage(item)) | |
{ | |
if (!item.Paths.IsContentItem) continue; | |
if (excludedPaths.Split('|').Any(p => item.Paths.ContentPath.Contains(p))) continue; | |
xml.WriteStartElement("url"); | |
xml.WriteElementString("loc", LinkManager.GetItemUrl(item, options)); | |
xml.WriteElementString("lastmod", item.Statistics.Updated.ToString("yyyy-MM-ddThh:mm:sszzz")); | |
xml.WriteEndElement(); | |
} | |
} | |
} | |
finally | |
{ | |
xml.WriteEndElement(); | |
xml.WriteEndDocument(); | |
xml.Flush(); | |
// Cache XML content | |
args.Context.Cache.Add("sitemapxml", xml.ToString(), null, | |
DateTime.Now.AddSeconds(int.Parse(cacheTime)), | |
Cache.NoSlidingExpiration, | |
CacheItemPriority.Normal, | |
null); | |
args.Context.Response.Flush(); | |
args.Context.Response.End(); | |
} | |
} | |
/// <summary> | |
/// Identify the items with a presentation detail | |
/// </summary> | |
/// <param name="item">Item to check</param> | |
/// <returns></returns> | |
private bool IsPage(Item item) | |
{ | |
var result = false; | |
var layoutField = new LayoutField(item.Fields[FieldIDs.LayoutField]); | |
if (!layoutField.InnerField.HasValue || string.IsNullOrEmpty(layoutField.Value)) return false; | |
var layout = LayoutDefinition.Parse(layoutField.Value); | |
foreach (var deviceObj in layout.Devices) | |
{ | |
var device = deviceObj as DeviceDefinition; | |
if (device == null) return false; | |
if (device.Renderings.Count > 0) | |
{ | |
result = true; | |
} | |
} | |
return result; | |
} | |
} | |
} |