<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<title>DocumentCloud &#187; Code</title>
	<atom:link href="http://blog.documentcloud.org/blog/category/code/feed/" rel="self" type="application/rss+xml" />
	<link>http://blog.documentcloud.org</link>
	<description>Just another WordPress site</description>
	<lastBuildDate>Thu, 05 Apr 2012 14:24:15 +0000</lastBuildDate>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.org/?v=3.3.2</generator>
		<item>
		<title>Code Release: Backbone.js 0.5.0</title>
		<link>http://blog.documentcloud.org/blog/2011/07/code-release-backbone-js-0-5-0/</link>
		<comments>http://blog.documentcloud.org/blog/2011/07/code-release-backbone-js-0-5-0/#comments</comments>
		<pubDate>Fri, 01 Jul 2011 18:06:57 +0000</pubDate>
		<dc:creator>Jeremy Ashkenas</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://blog.documentcloud.org/?p=145672</guid>
		<description><![CDATA[After being on the slow burner for several months, Backbone.js 0.5.0 was released this afternoon. Backbone is the JavaScript library that DocumentCloud uses to build out the workspace where reporters can upload, edit and organize their primary source documents. Along with a slew of tweaks and bug fixes, the most notable new feature is HTML5 [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2011/07/code-release-backbone-js-0-5-0/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Code Drop: VisualSearch.js</title>
		<link>http://blog.documentcloud.org/blog/2011/06/code-drop-visualsearch-js/</link>
		<comments>http://blog.documentcloud.org/blog/2011/06/code-drop-visualsearch-js/#comments</comments>
		<pubDate>Thu, 23 Jun 2011 16:23:58 +0000</pubDate>
		<dc:creator>Samuel Clay</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://blog.documentcloud.org/?p=145661</guid>
		<description><![CDATA[Over the past two years, we have released much of our toolset as open-source code: Backbone.js, Underscore.js, Jammit, CloudCrowd, and others. Today, we&#8217;re launching another piece of DocumentCloud — both on DocumentCloud.org and as a component you can integrate into your own projects. VisualSearch.js is a rich search box for real data. It enhances ordinary search boxes with [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2011/06/code-drop-visualsearch-js/feed/</wfw:commentRss>
		<slash:comments>7</slash:comments>
		</item>
		<item>
		<title>Improving the Quality of OCR</title>
		<link>http://blog.documentcloud.org/blog/2010/11/improving-the-quality-of-ocr/</link>
		<comments>http://blog.documentcloud.org/blog/2010/11/improving-the-quality-of-ocr/#comments</comments>
		<pubDate>Mon, 15 Nov 2010 20:09:32 +0000</pubDate>
		<dc:creator>Jeremy Ashkenas</dc:creator>
				<category><![CDATA[Code]]></category>
		<category><![CDATA[Workspace]]></category>

		<guid isPermaLink="false">http://blog.documentcloud.org/?p=608</guid>
		<description><![CDATA[When you upload a document to DocumentCloud, and the file does not contain text, we attempt to perform OCR (optical character recognition) on the document, using the open source Tesseract project. Tesseract is a venerable piece of software, originally developed at Hewlett-Packard between 1985 and 1995. Google acquired the project in 2006, and has been [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2010/11/improving-the-quality-of-ocr/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Code Drop: Backbone.js</title>
		<link>http://blog.documentcloud.org/blog/2010/10/code-drop-backbone-js/</link>
		<comments>http://blog.documentcloud.org/blog/2010/10/code-drop-backbone-js/#comments</comments>
		<pubDate>Wed, 13 Oct 2010 16:32:15 +0000</pubDate>
		<dc:creator>Jeremy Ashkenas</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://blog.documentcloud.org/?p=592</guid>
		<description><![CDATA[Another little piece of DocumentCloud is now available: Backbone supplies structure to JavaScript-heavy applications by providing models with key-value binding and custom events, collections with a rich API of enumerable functions, views with declarative event handling, and connects it all to your existing application over a RESTful JSON interface. We make heavy use of Backbone [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2010/10/code-drop-backbone-js/feed/</wfw:commentRss>
		<slash:comments>17</slash:comments>
		</item>
		<item>
		<title>Evaluating Amazon&#8217;s EC2 Micro Instances</title>
		<link>http://blog.documentcloud.org/blog/2010/09/evaluating-amazons-ec2-micro-instances/</link>
		<comments>http://blog.documentcloud.org/blog/2010/09/evaluating-amazons-ec2-micro-instances/#comments</comments>
		<pubDate>Wed, 15 Sep 2010 17:49:42 +0000</pubDate>
		<dc:creator>Samuel Clay</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://blog.documentcloud.org/?p=527</guid>
		<description><![CDATA[Here at DocumentCloud, we&#8217;re constantly turning PDF files and Office documents into embeddable document viewers. We extract text from the documents with OCR and generate images at multiple sizes for each of the thousands of pages we process every day. To crunch all of this data, we rely on High-CPU Medium instances on Amazon EC2, [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2010/09/evaluating-amazons-ec2-micro-instances/feed/</wfw:commentRss>
		<slash:comments>13</slash:comments>
		</item>
		<item>
		<title>Code Drop: Pixel Ping</title>
		<link>http://blog.documentcloud.org/blog/2010/09/code-drop-pixel-ping/</link>
		<comments>http://blog.documentcloud.org/blog/2010/09/code-drop-pixel-ping/#comments</comments>
		<pubDate>Wed, 08 Sep 2010 17:24:40 +0000</pubDate>
		<dc:creator>Jeremy Ashkenas</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://blog.documentcloud.org/?p=488</guid>
		<description><![CDATA[At this point at the end of our first summer, over 30 newsrooms are using DocumentCloud to augment their reporting by publishing selected source documents. You can see some examples of DocumentCloud in action on our list of featured documents or our recent MediaShift post. We&#8217;ll soon be allowing the general public to search the [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2010/09/code-drop-pixel-ping/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Introducing Page Notes</title>
		<link>http://blog.documentcloud.org/blog/2010/07/introducing-page-notes/</link>
		<comments>http://blog.documentcloud.org/blog/2010/07/introducing-page-notes/#comments</comments>
		<pubDate>Tue, 27 Jul 2010 16:13:33 +0000</pubDate>
		<dc:creator>Jeremy Ashkenas</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://blog.documentcloud.org/?p=368</guid>
		<description><![CDATA[The Document Viewer has always supported the ability to create &#8220;page notes&#8221; &#8212; annotations that sit between two pages and provide commentary about a specific page as a whole or an introduction to a new section of a document. This morning, we released an update to DocumentCloud that provides a way for you to create [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2010/07/introducing-page-notes/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>HTTPS Support (and Other Updates)</title>
		<link>http://blog.documentcloud.org/blog/2010/07/https-support-and-other-updates/</link>
		<comments>http://blog.documentcloud.org/blog/2010/07/https-support-and-other-updates/#comments</comments>
		<pubDate>Tue, 20 Jul 2010 14:15:59 +0000</pubDate>
		<dc:creator>Jeremy Ashkenas</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://blog.documentcloud.org/?p=345</guid>
		<description><![CDATA[Monday morning we rolled out SSL support on DocumentCloud.org &#8212; visit https://www.documentcloud.org to view, browse and edit documents in your workspace over an encrypted connection. When you use HTTPS, all traffic between your computer and DocumentCloud is encrypted before it&#8217;s sent over the internet. If you&#8217;re working on a public wireless connection, are on an [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2010/07/https-support-and-other-updates/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Bidding IE6 Adieu</title>
		<link>http://blog.documentcloud.org/blog/2010/07/bidding-ie6-adieu/</link>
		<comments>http://blog.documentcloud.org/blog/2010/07/bidding-ie6-adieu/#comments</comments>
		<pubDate>Fri, 09 Jul 2010 22:18:38 +0000</pubDate>
		<dc:creator>Amanda Hickman</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://blog.documentcloud.org/?p=317</guid>
		<description><![CDATA[Last week, we rolled out an update to DocumentCloud&#8217;s document viewer that included a wide range of improvements that you might never even notice. Page layouts and scrolling look very different under the hood, pages load and scroll much faster now, annotations work better, readers can resize a document viewer without setting off a barrage [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2010/07/bidding-ie6-adieu/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Collaboration</title>
		<link>http://blog.documentcloud.org/blog/2010/06/collaboration/</link>
		<comments>http://blog.documentcloud.org/blog/2010/06/collaboration/#comments</comments>
		<pubDate>Mon, 28 Jun 2010 14:44:00 +0000</pubDate>
		<dc:creator>Jeremy Ashkenas</dc:creator>
				<category><![CDATA[Code]]></category>
		<category><![CDATA[Workspace]]></category>

		<guid isPermaLink="false">http://blog.documentcloud.org/?p=291</guid>
		<description><![CDATA[Since we launched DocumentCloud&#8217;s beta, one of the most common requests has been: &#8220;How can I share documents with reporters from other organizations?&#8221; Now you can share a project with any other DocumentCloud user &#8212; in any newsroom. How does it work? Let&#8217;s say I have a project with documents relating to the Madoff Ponzi [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2010/06/collaboration/feed/</wfw:commentRss>
		<slash:comments>2</slash:comments>
		</item>
		<item>
		<title>Announcing Docsplit: Break Documents into Images, Pages, and Plain Text</title>
		<link>http://blog.documentcloud.org/blog/2009/12/announcing-docsplit-break-documents-into-images-pages-and-plain-text/</link>
		<comments>http://blog.documentcloud.org/blog/2009/12/announcing-docsplit-break-documents-into-images-pages-and-plain-text/#comments</comments>
		<pubDate>Mon, 07 Dec 2009 15:17:05 +0000</pubDate>
		<dc:creator>Jeremy Ashkenas</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://www.documentcloud.org/blog/?p=87</guid>
		<description><![CDATA[We&#8217;ve been spending a lot of time in the DocumentCloud Lab researching the best way to break apart documents into their component parts, to make it easier to index them for searching and to display them on the web. The latest open-source piece of DocumentCloud is a tool to help you extract images, thumbnails, plain [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2009/12/announcing-docsplit-break-documents-into-images-pages-and-plain-text/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Announcing Jammit: DocumentCloud&#8217;s Asset Packager</title>
		<link>http://blog.documentcloud.org/blog/2009/11/announcing-jammit-documentclouds-asset-packager/</link>
		<comments>http://blog.documentcloud.org/blog/2009/11/announcing-jammit-documentclouds-asset-packager/#comments</comments>
		<pubDate>Mon, 16 Nov 2009 15:35:43 +0000</pubDate>
		<dc:creator>Jeremy Ashkenas</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://www.documentcloud.org/blog/?p=75</guid>
		<description><![CDATA[The DocumentCloud prototype includes a &#8220;Journalist Workspace&#8221; — a tool for searching, organizing, and visualizing the relationships among documents. We&#8217;re building the workspace as a modern web application, which means that there&#8217;s a lot of static assets behind the scenes (JavaScript, templates, CSS, and images). The problem arises: how do you keep all of these [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2009/11/announcing-jammit-documentclouds-asset-packager/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Underscore.js: Our Second Open-Source Release</title>
		<link>http://blog.documentcloud.org/blog/2009/10/underscore-dot-js/</link>
		<comments>http://blog.documentcloud.org/blog/2009/10/underscore-dot-js/#comments</comments>
		<pubDate>Wed, 28 Oct 2009 13:51:00 +0000</pubDate>
		<dc:creator>Jeremy Ashkenas</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://www.documentcloud.org/blog/?p=51</guid>
		<description><![CDATA[We released the first open-source component of DocumentCloud a little over a month ago. Since then CloudCrowd has picked up a lot of steam, with hundreds of developers watching it on GitHub, and many patches and features being contributed by the community. Among other uses, it&#8217;s running gene sequence analysis on strains of influenza virus — [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2009/10/underscore-dot-js/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
		</item>
		<item>
		<title>Two Dozen Media Outlets and Others Join Us as Beta Testers</title>
		<link>http://blog.documentcloud.org/blog/2009/09/two-dozen-media-outlets-and-others-join-us-as-beta-testers/</link>
		<comments>http://blog.documentcloud.org/blog/2009/09/two-dozen-media-outlets-and-others-join-us-as-beta-testers/#comments</comments>
		<pubDate>Thu, 24 Sep 2009 12:00:05 +0000</pubDate>
		<dc:creator>Scott</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://www.documentcloud.org/blog/?p=32</guid>
		<description><![CDATA[We have some more news: About two dozen news and other organizations have signed on as beta-testers. They&#8217;ll be contributing documents to DocumentCloud, and giving us feedback as we work out the kinks. It&#8217;s a wide-ranging list: ACLU National Security Project Arizona Republic The Atlantic Center for Democracy and Technology / OpenCRS Centre for Investigative [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2009/09/two-dozen-media-outlets-and-others-join-us-as-beta-testers/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Thomson Reuters and OpenCalais</title>
		<link>http://blog.documentcloud.org/blog/2009/09/thomson-reuters-opencalais/</link>
		<comments>http://blog.documentcloud.org/blog/2009/09/thomson-reuters-opencalais/#comments</comments>
		<pubDate>Thu, 24 Sep 2009 11:30:02 +0000</pubDate>
		<dc:creator>Scott</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://www.documentcloud.org/blog/?p=34</guid>
		<description><![CDATA[This morning we&#8217;re excited to announce a partnership with Thomson Reuters, which is contributing its OpenCalais service to DocumentCloud. OpenCalais uses natural language processing to extract information from documents, instantly identifying and tagging the relevant people, places, companies, facts and events. This will make it easy for readers and journalists to explore connections between documents [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2009/09/thomson-reuters-opencalais/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
		</item>
		<item>
		<title>CloudCrowd — Parallel Processing for the Rest of Us</title>
		<link>http://blog.documentcloud.org/blog/2009/09/cloudcrowd-parallel-processing-for-the-rest-of-us/</link>
		<comments>http://blog.documentcloud.org/blog/2009/09/cloudcrowd-parallel-processing-for-the-rest-of-us/#comments</comments>
		<pubDate>Mon, 14 Sep 2009 13:29:46 +0000</pubDate>
		<dc:creator>Jeremy Ashkenas</dc:creator>
				<category><![CDATA[Code]]></category>

		<guid isPermaLink="false">http://www.documentcloud.org/blog/?p=15</guid>
		<description><![CDATA[As we began to prototype DocumentCloud, it quickly became apparent that we&#8217;re going to need a heavy-duty system for document processing. Our PDFs need to have their text extracted, their images scaled and converted, and their entities extracted for later cataloging. All of these things are computationally expensive, keeping your laptop hot and busy for minutes, [...]]]></description>
		<wfw:commentRss>http://blog.documentcloud.org/blog/2009/09/cloudcrowd-parallel-processing-for-the-rest-of-us/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
	</channel>
</rss>

