aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorJauhien Piatlicki (jauhien) <piatlicki@gmail.com>2013-07-25 01:32:43 +0200
committerJauhien Piatlicki (jauhien) <piatlicki@gmail.com>2013-07-25 01:32:43 +0200
commit189f6b962da3a77695a3ee7d13e2104b51637580 (patch)
treebf0afc04f0daa19109c6d5926b4a5b4e14a097b2 /gs_pypi
parentPyPI backend: experiments (diff)
downloadg-sorcery-189f6b962da3a77695a3ee7d13e2104b51637580.tar.gz
g-sorcery-189f6b962da3a77695a3ee7d13e2104b51637580.tar.bz2
g-sorcery-189f6b962da3a77695a3ee7d13e2104b51637580.zip
PyPI backend: obtain metadata from the site
Diffstat (limited to 'gs_pypi')
-rw-r--r--gs_pypi/pypi_db.py69
1 files changed, 19 insertions, 50 deletions
diff --git a/gs_pypi/pypi_db.py b/gs_pypi/pypi_db.py
index 71e5397..3c3e491 100644
--- a/gs_pypi/pypi_db.py
+++ b/gs_pypi/pypi_db.py
@@ -11,60 +11,29 @@
:license: GPL-2, see LICENSE for more details.
"""
-from g_sorcery.compatibility import py2k
+import bs4
-if py2k:
- import xmlrpclib
- import httplib
- urlparse
-else:
- import xmlrpc.client as xmlrpclib
- import http.client as httplib
- import urllib.parse as urlparse
-
-import sys
-
-from g_sorcery.logger import Logger
from g_sorcery.package_db import DBGenerator
class PypiDBGenerator(DBGenerator):
- def process_uri(self, uri, data):
- url = uri["uri"]
- client = xmlrpclib.ServerProxy(url)
- logger = Logger()
- logger.info("downloading packages data")
- pkg_list = client.list_packages()
-
- number_of_packages = len(pkg_list)
- downloaded_number = 0
-
- connection = httplib.HTTPConnection(urlparse.urlparse(url).netloc)
-
- connection.request("GET", "/pypi/zmqpy/json")
- response = connection.getresponse()
- print(response.getheaders())
-
- for pkg in pkg_list:
- data[pkg] = {}
-
- chars = ['-','\\','|','/']
- show = chars[downloaded_number % 4]
- percent = (downloaded_number * 100)//number_of_packages
- length = 70
- progress = (percent * length)//100
- blank = length - progress
-
- sys.stdout.write("\r %s [%s%s] %s%%" % (show, "#" * progress, " " * blank, percent))
- sys.stdout.flush()
- downloaded_number += 1
-
- connection.close()
-
- sys.stdout.write("\r %s [%s] %s%%" % ("-", "#" * length, 100))
- sys.stdout.flush()
- print("")
+ def get_download_uries(self, common_config, config):
+ return [config["repo_uri"] + "?%3Aaction=index"]
+ def parse_data(self, data_f):
+ soup = bs4.BeautifulSoup(data_f.read())
+ return soup.table
+
+
def process_data(self, pkg_db, data, common_config, config):
- #print(data)
- pass
+ data = data["pypi?:action=index"]
+ for entry in data.find_all("tr")[1:-1]:
+ package, description = entry.find_all("td")
+
+ if description.contents:
+ description = description.contents[0]
+ else:
+ description = ""
+ package, version = package.a["href"].split("/")[2:]
+
+ print(package, version, description)