content/doap.rdf (255 lines of code) (raw):

<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl"?>
<rdf:RDF xml:lang="en"
         xmlns="http://usefulinc.com/ns/doap#"
         xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
         xmlns:asfext="http://projects.apache.org/ns/asfext#"
         xmlns:foaf="http://xmlns.com/foaf/0.1/">
<!--
    Licensed to the Apache Software Foundation (ASF) under one or more
    contributor license agreements.  See the NOTICE file distributed with
    this work for additional information regarding copyright ownership.
    The ASF licenses this file to You under the Apache License, Version 2.0
    (the "License"); you may not use this file except in compliance with
    the License.  You may obtain a copy of the License at

         http://www.apache.org/licenses/LICENSE-2.0

    Unless required by applicable law or agreed to in writing, software
    distributed under the License is distributed on an "AS IS" BASIS,
    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    See the License for the specific language governing permissions and
    limitations under the License.
-->
  <!--
      DOAP (Description of a Project) record for Apache Nutch.
      Unprefixed elements are in the DOAP namespace declared on the root;
      asfext: carries the ASF-specific extension and foaf: the maintainer contact.
  -->
  <Project rdf:about="https://nutch.apache.org">
    <created>2011-07-21</created>
    <license rdf:resource="http://www.apache.org/licenses/LICENSE-2.0"/>
    <name>Apache Nutch</name>
    <homepage rdf:resource="https://nutch.apache.org"/>
    <asfext:pmc rdf:resource="https://nutch.apache.org"/>
    <shortdesc>Apache Nutch is an open source web crawler software project.</shortdesc>
    <!-- The description literal is intentionally not re-wrapped or indented:
         whitespace inside the element is part of the value. -->
    <description>Apache Nutch is a highly extensible and scalable open source web crawler software project. Stemming from Apache Lucene, Nutch is a well matured, production ready batch crawler relying on Apache Hadoop data structures, which are great for batch processing. Nutch has a modular architecture and provides pluggable and extensible interfaces such as Parse, Index and ScoringFilters for custom implementations e.g. Apache Tika for parsing. Additionally, pluggable indexers exist for Apache Solr, Elastic Search, etc.
Nutch can run on a single machine, but gains a lot of its strength from running in a Hadoop cluster. The now retired branch Nutch 2.x differed from 1.x in one key area: storage is abstracted away from any specific underlying data store by using Apache Gora for handling object to persistent mappings and to store fetch time, status, content, parsed text, outlinks, inlinks, etc. into a number of NoSQL storage solutions.</description>
    <bug-database rdf:resource="https://issues.apache.org/jira/projects/NUTCH"/>
    <mailing-list rdf:resource="https://nutch.apache.org/mailing_lists.html"/>
    <download-page rdf:resource="https://www.apache.org/dyn/closer.cgi/nutch/"/>
    <programming-language>Java</programming-language>
    <category rdf:resource="https://projects.apache.org/category/web-framework"/>

    <!-- Releases, newest first. Each <revision> is the version number of the
         release named in the sibling <name>. -->
    <release>
      <Version>
        <name>Apache Nutch 1.19</name>
        <created>2022-08-22</created>
        <revision>1.19</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.18</name>
        <created>2021-01-14</created>
        <revision>1.18</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.17</name>
        <created>2020-06-18</created>
        <revision>1.17</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.16</name>
        <created>2019-10-11</created>
        <revision>1.16</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 2.4</name>
        <created>2019-10-11</created>
        <revision>2.4</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.15</name>
        <created>2018-08-09</created>
        <revision>1.15</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.14</name>
        <created>2017-12-22</created>
        <revision>1.14</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.13</name>
        <created>2017-04-02</created>
        <revision>1.13</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.12</name>
        <created>2016-06-18</created>
        <revision>1.12</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 2.3.1</name>
        <created>2016-01-21</created>
        <revision>2.3.1</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.11</name>
        <created>2015-12-07</created>
        <revision>1.11</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.10</name>
        <created>2015-05-06</created>
        <revision>1.10</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 2.3</name>
        <created>2015-01-22</created>
        <revision>2.3</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.9</name>
        <created>2014-08-16</created>
        <revision>1.9</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.8</name>
        <created>2014-03-17</created>
        <revision>1.8</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 2.2.1</name>
        <created>2013-07-02</created>
        <revision>2.2.1</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.7</name>
        <created>2013-06-24</created>
        <revision>1.7</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 2.2</name>
        <created>2013-06-05</created>
        <revision>2.2</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.6</name>
        <created>2012-12-06</created>
        <revision>1.6</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 2.1</name>
        <created>2012-10-05</created>
        <revision>2.1</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.5.1</name>
        <created>2012-07-10</created>
        <revision>1.5.1</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 2.0</name>
        <created>2012-07-07</created>
        <revision>2.0</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.5</name>
        <created>2012-06-07</created>
        <revision>1.5</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.4</name>
        <!-- NOTE(review): this date is earlier than the 1.3 release below
             (2011-06-07), although the list is otherwise newest-first.
             Looks like a typo; confirm against the 1.4 release announcement. -->
        <created>2011-04-11</created>
        <revision>1.4</revision>
      </Version>
    </release>
    <release>
      <Version>
        <name>Apache Nutch 1.3</name>
        <created>2011-06-07</created>
        <revision>1.3</revision>
      </Version>
    </release>

    <!-- Older releases: these entries additionally record the source branch
         and use the lowercase "nutch-x.y" naming. -->
    <release>
      <Version>
        <branch>branch-1.0</branch>
        <name>nutch-1.0</name>
        <created>2009-03-23</created>
        <revision>1.0</revision>
      </Version>
    </release>
    <release>
      <Version>
        <branch>branch-0.9</branch>
        <name>nutch-0.9</name>
        <created>2007-04-01</created>
        <revision>0.9</revision>
      </Version>
    </release>
    <release>
      <Version>
        <branch>branch-0.8</branch>
        <name>nutch-0.8.1</name>
        <created>2006-09-24</created>
        <revision>0.8.1</revision>
      </Version>
    </release>
    <release>
      <Version>
        <branch>branch-0.8</branch>
        <name>nutch-0.8</name>
        <created>2006-06-25</created>
        <revision>0.8</revision>
      </Version>
    </release>
    <release>
      <Version>
        <branch>branch-0.7</branch>
        <name>nutch-0.7.2</name>
        <created>2006-03-31</created>
        <revision>0.7.2</revision>
      </Version>
    </release>

    <!-- Source repositories: the ASF GitBox location and the GitHub location. -->
    <repository>
      <GitRepository>
        <location rdf:resource="https://gitbox.apache.org/repos/asf/nutch.git"/>
        <browse rdf:resource="https://gitbox.apache.org/repos/asf?p=nutch.git;a=summary"/>
      </GitRepository>
    </repository>
    <repository>
      <GitRepository>
        <location rdf:resource="https://github.com/apache/nutch.git"/>
        <browse rdf:resource="https://github.com/apache/nutch/"/>
      </GitRepository>
    </repository>

    <!-- Contact point for the project as a whole rather than an individual. -->
    <maintainer>
      <foaf:Person>
        <foaf:name>Nutch PMC</foaf:name>
        <foaf:mbox rdf:resource="mailto:dev@nutch.apache.org"/>
      </foaf:Person>
    </maintainer>
  </Project>
</rdf:RDF>