new spells: w3lib & scrapy

author: Ismael Luceno 2011-05-31 14:42:04 -0300
committer: Ismael Luceno 2011-05-31 15:50:15 -0300
commit: 7fa8c55e5439e39d482e668e085a2799bff8b021 (patch)
tree: 3fa946b8382bf5ae2f27ed89dab2b18540438e5d
parent: 7193282772e7fb7a623db83752237b9cf799f00b (diff)
7 files changed, 55 insertions, 0 deletions
diff --git a/ChangeLog b/ChangeLog
index 33823a4738..606935a57f 100644
--- a/ChangeLog
+++ b/ChangeLog
@@ -1,3 +1,7 @@
+2011-05-31 Ismael Luceno <ismael@sourcemage.org>
+	* python-pypi/w3lib: new spell, Library of web-related functions
+	* python-pypi/scrapy: new spell, A high-level Python Screen Scraping framework
+
 2011-05-31 Treeve Jelbert <treeve@sourcemage.org>
 	* python-pypi/geraldo: new spell, python reporting engine
 
diff --git a/python-pypi/scrapy/DEPENDS b/python-pypi/scrapy/DEPENDS
new file mode 100755
index 0000000000..ff175185e3
--- /dev/null
+++ b/python-pypi/scrapy/DEPENDS
@@ -0,0 +1,7 @@
+depends python       &&
+depends SETUPTOOLS   &&
+depends twisted      &&
+depends lxml         &&
+depends simplejson   &&
+depends w3lib        &&
+depends pyopenssl
diff --git a/python-pypi/scrapy/DETAILS b/python-pypi/scrapy/DETAILS
new file mode 100755
index 0000000000..322ecf65a3
--- /dev/null
+++ b/python-pypi/scrapy/DETAILS
@@ -0,0 +1,16 @@
+           SPELL=scrapy
+          SPELLX=Scrapy
+         VERSION=0.12.0.2542
+     SOURCE_HASH=sha512:b9346a3f723e241df5a6164d5f938f4c39e83fff7c275d450f6bea0de9686ccf6be26ce6b27e0ae9e7917495010ecb29c12f49091e26c858e51883cd4cab1507
+          SOURCE=$SPELLX-$VERSION.tar.gz
+   SOURCE_URL[0]=http://pypi.python.org/packages/source/S/$SPELLX/$SOURCE
+SOURCE_DIRECTORY="$BUILD_DIRECTORY/$SPELLX-$VERSION"
+        WEB_SITE=http://scrapy.org/
+      LICENSE[0]=BSD
+         UPDATED=20110531
+           SHORT='A high-level Python Screen Scraping framework'
+cat << EOF
+Scrapy is a high-level scraping and web crawling framework for writing spiders
+to crawl and parse web pages for all kinds of purposes, from information
+retrieval to monitoring or testing web sites.
+EOF
diff --git a/python-pypi/scrapy/HISTORY b/python-pypi/scrapy/HISTORY
new file mode 100644
index 0000000000..6b244bfa43
--- /dev/null
+++ b/python-pypi/scrapy/HISTORY
@@ -0,0 +1,2 @@
+2011-05-31 Ismael Luceno <ismael@sourcemage.org>
+	* DEPENDS, DETAILS: spell created
diff --git a/python-pypi/w3lib/DEPENDS b/python-pypi/w3lib/DEPENDS
new file mode 100755
index 0000000000..84a0acc92a
--- /dev/null
+++ b/python-pypi/w3lib/DEPENDS
@@ -0,0 +1,2 @@
+depends python       &&
+depends SETUPTOOLS
diff --git a/python-pypi/w3lib/DETAILS b/python-pypi/w3lib/DETAILS
new file mode 100755
index 0000000000..df50dad871
--- /dev/null
+++ b/python-pypi/w3lib/DETAILS
@@ -0,0 +1,22 @@
+           SPELL=w3lib
+         VERSION=1.0
+     SOURCE_HASH=sha512:007c6c08708c97be542937c598731dea07449e67ec90c5ce66aec5dce9286681ab04c007ed180fa1b7274ae74ecb8dc3c6520e422debee6f0420d9817f30bc03
+          SOURCE=$SPELL-$VERSION.tar.gz
+   SOURCE_URL[0]=http://pypi.python.org/packages/source/w/$SPELL/$SOURCE
+SOURCE_DIRECTORY="$BUILD_DIRECTORY/$SPELL-$VERSION"
+        WEB_SITE=http://github.com/scrapy/w3lib
+      LICENSE[0]=BSD
+         UPDATED=20110531
+           SHORT='Library of web-related functions'
+cat << EOF
+This is a Python library of web-related functions, such as:
+* remove comments, or tags from HTML snippets
+* extract base url from HTML snippets
+* translate entities on HTML strings
+* encoding multipart/form-data
+* convert raw HTTP headers to dicts and vice-versa
+* construct HTTP auth header
+* RFC-compliant url joining
+* sanitize urls (like browsers do)
+* extract arguments from urls
+EOF
diff --git a/python-pypi/w3lib/HISTORY b/python-pypi/w3lib/HISTORY
new file mode 100644
index 0000000000..6b244bfa43
--- /dev/null
+++ b/python-pypi/w3lib/HISTORY
@@ -0,0 +1,2 @@
+2011-05-31 Ismael Luceno <ismael@sourcemage.org>
+	* DEPENDS, DETAILS: spell created
author	Ismael Luceno	2011-05-31 14:42:04 -0300
committer	Ismael Luceno	2011-05-31 15:50:15 -0300
commit	7fa8c55e5439e39d482e668e085a2799bff8b021 (patch)
tree	3fa946b8382bf5ae2f27ed89dab2b18540438e5d
parent	7193282772e7fb7a623db83752237b9cf799f00b (diff)