diff options
Diffstat (limited to 'lib/utils/pydelicious.py')
-rw-r--r-- | lib/utils/pydelicious.py | 858 |
1 files changed, 543 insertions, 315 deletions
diff --git a/lib/utils/pydelicious.py b/lib/utils/pydelicious.py index dd33788..8e45843 100644 --- a/lib/utils/pydelicious.py +++ b/lib/utils/pydelicious.py @@ -1,131 +1,126 @@ """Library to access del.icio.us data via Python. -:examples: - - Using the API class directly: - - >>> a = pydelicious.apiNew('user', 'passwd') - >>> # or: - >>> a = DeliciousAPI('user', 'passwd') - >>> a.tags_get() # Same as: - >>> a.request('tags/get', ) - - Or by calling one of the methods on the module: - - - add(user, passwd, url, description, tags = "", extended = "", dt = "", replace="no") - - get(user, passwd, tag="", dt="", count = 0) - - get_all(user, passwd, tag = "") - - delete(user, passwd, url) - - rename_tag(user, passwd, oldtag, newtag) - - get_tags(user, passwd) - - >>> a = apiNew(user, passwd) - >>> a.posts_add(url="http://my.com/", desciption="my.com", extended="the url is my.moc", tags="my com") - True - >>> len(a.posts_all()) - 1 - >>> get_all(user, passwd) - 1 - - This are short functions for getrss calls. - - >>> rss_ - -def get_userposts(user): -def get_tagposts(tag): -def get_urlposts(url): -def get_popular(tag = ""): - - >>> json_posts() - >>> json_tags() - >>> json_network() - >>> json_fans() - -:License: pydelicious is released under the BSD license. See 'license.txt' - for more informations. - -:todo, bvb: - - Rewriting comments to english. More documentation, examples. - - Added JSON-like return values for XML data (del.icio.us also serves some JSON...) - - better error/exception classes and handling, work in progress. - -:todo: - - Source code SHOULD BE ASCII! - - More tests. - - handling different encodings, what, how? - >>> pydelicious.getrss(tag="t[a]g") - url: http://del.icio.us/rss/tag/t[a]g - - Parse datetimes in XML. - - Test RSS functionality? HTML scraping doesn't work yet? - - API functions need required argument checks. - - interesting functionality in other libraries (ruby, java, perl, etc)? - - what is pydelicious used for? - - license, readme docs via setup.py verdelen? - - automatic releas build - -:done: - * Refactored the API class, much cleaner now and functions dlcs_api_request, dlcs_parse_xml are available for who wants them. +An introduction to the project is given in the README. +pydelicious is released under the BSD license. See license.txt for details +and the copyright holders. + +THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND +ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED +WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE +DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR +ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES +(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; +LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON +ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT +(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS +SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. + +TODO: + - distribute license, readme docs via setup.py? + - automatic release build? """ import sys import os import time import datetime -import md5, httplib -import urllib, urllib2, time +import locale +import httplib +import urllib2 +from urllib import urlencode, quote_plus from StringIO import StringIO +from pprint import pformat + +v = sys.version_info +if v[0] >= 2 and v[1] >= 5: + from hashlib import md5 +else: + from md5 import md5 try: from elementtree.ElementTree import parse as parse_xml except ImportError: - from xml.etree.ElementTree import parse as parse_xml + # Python 2.5 and higher + from xml.etree.ElementTree import parse as parse_xml -import feedparser +try: + import feedparser +except ImportError: + print >>sys.stderr, \ + "Feedparser not available, no RSS parsing." + feedparser = None ### Static config -__version__ = '0.5.0' -__author__ = 'Frank Timmermann <regenkind_at_gmx_dot_de>' # GP: does not respond to emails +__version__ = '0.5.3' +__author__ = 'Frank Timmermann <regenkind_at_gmx_dot_de>' + # GP: does not respond to emails __contributors__ = [ 'Greg Pinero', 'Berend van Berkum <berend+pydelicious@dotmpe.com>'] __url__ = 'http://code.google.com/p/pydelicious/' -__author_email__ = "" # Old URL: 'http://deliciouspython.python-hosting.com/' - -__description__ = '''pydelicious.py allows you to access the web service of del.icio.us via it's API through python.''' -__long_description__ = '''the goal is to design an easy to use and fully functional python interface to del.icio.us. ''' - -DLCS_OK_MESSAGES = ('done', 'ok') # Known text values of positive del.icio.us <result> answers +__author_email__ = "" +__docformat__ = "restructuredtext en" +__description__ = "pydelicious.py allows you to access the web service of " \ + "del.icio.us via it's API through Python." +__long_description__ = "The goal is to design an easy to use and fully " \ + "functional Python interface to del.icio.us." + +DLCS_OK_MESSAGES = ('done', 'ok') +"Known text values of positive del.icio.us <result/> answers" DLCS_WAIT_TIME = 4 -DLCS_REQUEST_TIMEOUT = 444 # Seconds before socket triggers timeout +"Time to wait between API requests" +DLCS_REQUEST_TIMEOUT = 444 +"Seconds before socket triggers timeout" #DLCS_API_REALM = 'del.icio.us API' -DLCS_API_HOST = 'https://api.del.icio.us' +DLCS_API_HOST = 'api.del.icio.us' DLCS_API_PATH = 'v1' -DLCS_API = "%s/%s" % (DLCS_API_HOST, DLCS_API_PATH) +DLCS_API = "https://%s/%s" % (DLCS_API_HOST, DLCS_API_PATH) DLCS_RSS = 'http://del.icio.us/rss/' +DLCS_FEEDS = 'http://feeds.delicious.com/v2/' + +PREFERRED_ENCODING = locale.getpreferredencoding() +# XXX: might need to check sys.platform/encoding combinations here, ie +#if sys.platform == 'darwin' || PREFERRED_ENCODING == 'macroman: +# PREFERRED_ENCODING = 'utf-8' +if not PREFERRED_ENCODING: + PREFERRED_ENCODING = 'iso-8859-1' ISO_8601_DATETIME = '%Y-%m-%dT%H:%M:%SZ' -USER_AGENT = 'pydelicious.py/%s %s' % (__version__, __url__) +USER_AGENT = 'pydelicious/%s %s' % (__version__, __url__) DEBUG = 0 if 'DLCS_DEBUG' in os.environ: DEBUG = int(os.environ['DLCS_DEBUG']) - - -# Taken from FeedParser.py -# timeoutsocket allows feedparser to time out rather than hang forever on ultra-slow servers. -# Python 2.3 now has this functionality available in the standard socket library, so under -# 2.3 you don't need to install anything. But you probably should anyway, because the socket -# module is buggy and timeoutsocket is better. + if DEBUG: + print >>sys.stderr, \ + "Set DEBUG to %i from DLCS_DEBUG env." % DEBUG + +HTTP_PROXY = None +if 'HTTP_PROXY' in os.environ: + HTTP_PROXY = os.environ['HTTP_PROXY'] + if DEBUG: + print >>sys.stderr, \ + "Set HTTP_PROXY to %i from env." % HTTP_PROXY + +### Timeoutsocket hack taken from FeedParser.py + +# timeoutsocket allows feedparser to time out rather than hang forever on ultra- +# slow servers. Python 2.3 now has this functionality available in the standard +# socket library, so under 2.3 you don't need to install anything. But you +# probably should anyway, because the socket module is buggy and timeoutsocket +# is better. try: import timeoutsocket # http://www.timo-tasi.org/python/timeoutsocket.py timeoutsocket.setDefaultSocketTimeout(DLCS_REQUEST_TIMEOUT) except ImportError: import socket - if hasattr(socket, 'setdefaulttimeout'): socket.setdefaulttimeout(DLCS_REQUEST_TIMEOUT) -if DEBUG: print >>sys.stderr, "Set socket timeout to %s seconds" % DLCS_REQUEST_TIMEOUT + if hasattr(socket, 'setdefaulttimeout'): + socket.setdefaulttimeout(DLCS_REQUEST_TIMEOUT) +if DEBUG: print >>sys.stderr, \ + "Set socket timeout to %s seconds" % DLCS_REQUEST_TIMEOUT ### Utility classes @@ -163,91 +158,64 @@ class _Waiter: Waiter = _Waiter(DLCS_WAIT_TIME) + class PyDeliciousException(Exception): - '''Std. pydelicious error''' - pass + """Standard pydelicious error""" +class PyDeliciousThrottled(Exception): pass +class PyDeliciousUnauthorized(Exception): pass class DeliciousError(Exception): """Raised when the server responds with a negative answer""" + @staticmethod + def raiseFor(error_string, path, **params): + if error_string == 'item already exists': + raise DeliciousItemExistsError, params['url'] + else: + raise DeliciousError, "%s, while calling <%s?%s>" % (error_string, + path, urlencode(params)) -class DefaultErrorHandler(urllib2.HTTPDefaultErrorHandler): - '''xxx, bvb: Where is this used? should it be registered somewhere with urllib2? - - Handles HTTP Error, currently only 503. - ''' - def http_error_503(self, req, fp, code, msg, headers): - raise urllib2.HTTPError(req, code, throttled_message, headers, fp) - +class DeliciousItemExistsError(DeliciousError): + """Raised then adding an already existing post.""" -class post(dict): - """Post object, contains href, description, hash, dt, tags, - extended, user, count(, shared). - xxx, bvb: Not used in DeliciousAPI - """ - def __init__(self, href="", description="", hash="", time="", tag="", extended="", user="", count="", - tags="", url="", dt=""): # tags or tag? - self["href"] = href - if url != "": self["href"] = url - self["description"] = description - self["hash"] = hash - self["dt"] = dt - if time != "": self["dt"] = time - self["tags"] = tags - if tag != "": self["tags"] = tag # tag or tags? # !! tags - self["extended"] = extended - self["user"] = user - self["count"] = count - - def __getattr__(self, name): - try: return self[name] - except: object.__getattribute__(self, name) - - -class posts(list): - def __init__(self, *args): - for i in args: self.append(i) - - def __getattr__(self, attr): - try: return [p[attr] for p in self] - except: object.__getattribute__(self, attr) +class HTTPErrorHandler(urllib2.HTTPDefaultErrorHandler): -### Utility functions + def http_error_401(self, req, fp, code, msg, headers): + raise PyDeliciousUnauthorized, "Check credentials." -def str2uni(s): - # type(in) str or unicode - # type(out) unicode - return ("".join([unichr(ord(i)) for i in s])) + def http_error_503(self, req, fp, code, msg, headers): + # Retry-After? + errmsg = "Try again later." + if 'Retry-After' in headers: + errmsg = "You may try again after %s" % headers['Retry-After'] + raise PyDeliciousThrottled, errmsg -def str2utf8(s): - # type(in) str or unicode - # type(out) str - return ("".join([unichr(ord(i)).encode("utf-8") for i in s])) -def str2quote(s): - return urllib.quote_plus("".join([unichr(ord(i)).encode("utf-8") for i in s])) +### Utility functions def dict0(d): - # Trims empty dict entries - # {'a':'a', 'b':'', 'c': 'c'} => {'a': 'a', 'c': 'c'} - dd = dict() - for i in d: - if d[i] != "": dd[i] = d[i] - return dd + "Removes empty string values from dictionary" + return dict([(k,v) for k,v in d.items() + if v=='' and isinstance(v, basestring)]) + def delicious_datetime(str): """Parse a ISO 8601 formatted string to a Python datetime ... """ return datetime.datetime(*time.strptime(str, ISO_8601_DATETIME)[0:6]) -def http_request(url, user_agent=USER_AGENT, retry=4): + +def http_request(url, user_agent=USER_AGENT, retry=4, opener=None): """Retrieve the contents referenced by the URL using urllib2. Retries up to four times (default) on exceptions. """ request = urllib2.Request(url, headers={'User-Agent':user_agent}) + if not opener: + opener = urllib2.build_opener() + # Remember last error e = None @@ -255,9 +223,10 @@ def http_request(url, user_agent=USER_AGENT, retry=4): tries = retry; while tries: try: - return urllib2.urlopen(request) + return opener.open(request) - except urllib2.HTTPError, e: # protocol errors, + except urllib2.HTTPError, e: + # reraise unexpected protocol errors as PyDeliciousException raise PyDeliciousException, "%s" % e except urllib2.URLError, e: @@ -273,50 +242,99 @@ def http_request(url, user_agent=USER_AGENT, retry=4): raise PyDeliciousException, \ "Unable to retrieve data at '%s', %s" % (url, e) -def http_auth_request(url, host, user, passwd, user_agent=USER_AGENT): - """Call an HTTP server with authorization credentials using urllib2. + +def build_api_opener(host, user, passwd, extra_handlers=() ): """ + Build a urllib2 style opener with HTTP Basic authorization for one host + and additional error handling. If HTTP_PROXY is set a proxyhandler is also + added. + """ + + global DEBUG + if DEBUG: httplib.HTTPConnection.debuglevel = 1 - # Hook up handler/opener to urllib2 password_manager = urllib2.HTTPPasswordMgrWithDefaultRealm() password_manager.add_password(None, host, user, passwd) auth_handler = urllib2.HTTPBasicAuthHandler(password_manager) - opener = urllib2.build_opener(auth_handler) - urllib2.install_opener(opener) - return http_request(url, user_agent) + extra_handlers += ( HTTPErrorHandler(), ) + if HTTP_PROXY: + extra_handlers += ( urllib2.ProxyHandler( {'http': HTTP_PROXY} ), ) + + return urllib2.build_opener(auth_handler, *extra_handlers) + + +def dlcs_api_opener(user, passwd): + "Build an opener for DLCS_API_HOST, see build_api_opener()" -def dlcs_api_request(path, params='', user='', passwd='', throttle=True): + return build_api_opener(DLCS_API_HOST, user, passwd) + + +def dlcs_api_request(path, params='', user='', passwd='', throttle=True, + opener=None): """Retrieve/query a path within the del.icio.us API. This implements a minimum interval between calls to avoid throttling. [#]_ Use param 'throttle' to turn this behaviour off. - todo: back off on 503's (HTTPError, URLError? testing - - Returned XML does not always correspond with given del.icio.us examples - [#]_. - .. [#] http://del.icio.us/help/api/ """ if throttle: Waiter() if params: - # params come as a dict, strip empty entries and urlencode - url = "%s/%s?%s" % (DLCS_API, path, urllib.urlencode(dict0(params))) + url = "%s/%s?%s" % (DLCS_API, path, urlencode(params)) else: url = "%s/%s" % (DLCS_API, path) - if DEBUG: print >>sys.stderr, "dlcs_api_request: %s" % url + if DEBUG: print >>sys.stderr, \ + "dlcs_api_request: %s" % url - try: - return http_auth_request(url, DLCS_API_HOST, user, passwd, USER_AGENT) + if not opener: + opener = dlcs_api_opener(user, passwd) + + fl = http_request(url, opener=opener) + + if DEBUG>2: print >>sys.stderr, \ + pformat(fl.info().headers) + + return fl + + +def dlcs_encode_params(params, usercodec=PREFERRED_ENCODING): + """Turn all param values (int, list, bool) into utf8 encoded strings. + """ + + if params: + for key in params.keys(): + if isinstance(params[key], bool): + if params[key]: + params[key] = 'yes' + else: + params[key] = 'no' + + elif isinstance(params[key], int): + params[key] = str(params[key]) + + elif not params[key]: + # strip/ignore empties other than False or 0 + del params[key] + continue + + elif isinstance(params[key], list): + params[key] = " ".join(params[key]) + + elif not isinstance(params[key], unicode): + params[key] = params[key].decode(usercodec) + + assert isinstance(params[key], basestring) + + params = dict([ (k, v.encode('utf8')) + for k, v in params.items() if v]) + + return params - # bvb: Is this ever raised? When? - except DefaultErrorHandler, e: - print >>sys.stderr, "%s" % e def dlcs_parse_xml(data, split_tags=False): """Parse any del.icio.us XML document and return Python data structure. @@ -332,6 +350,7 @@ def dlcs_parse_xml(data, split_tags=False): {'result':(True, "done")} # etcetera. """ + # TODO: split_tags is not implemented if DEBUG>3: print >>sys.stderr, "dlcs_parse_xml: parsing from ", data @@ -367,55 +386,67 @@ def dlcs_parse_xml(data, split_tags=False): else: msg = root.text - # Return {'result':(True, msg)} for /known/ O.K. messages, - # use (False, msg) otherwise + # XXX: Return {'result':(True, msg)} for /known/ O.K. messages, + # use (False, msg) otherwise. Move this to DeliciousAPI? v = msg in DLCS_OK_MESSAGES return {fmt: (v, msg)} elif fmt == 'update': # Update: "time" - #return {fmt: root.attrib} - return {fmt: {'time':time.strptime(root.attrib['time'], ISO_8601_DATETIME)}} + return {fmt: { + 'time':time.strptime(root.attrib['time'], ISO_8601_DATETIME) }} else: raise PyDeliciousException, "Unknown XML document format '%s'" % fmt -def dlcs_rss_request(tag = "", popular = 0, user = "", url = ''): - """Handle a request for RSS - - todo: translate from German - rss sollte nun wieder funktionieren, aber diese try, except scheisse ist so nicht schoen +def dlcs_rss_request(tag="", popular=0, user="", url=''): + """Parse a RSS request. - rss wird unterschiedlich zusammengesetzt. ich kann noch keinen einheitlichen zusammenhang - zwischen daten (url, desc, ext, usw) und dem feed erkennen. warum k[o]nnen die das nicht einheitlich machen? + This requests old (now undocumented?) URL paths that still seem to work. """ - tag = str2quote(tag) - user = str2quote(user) + + tag = quote_plus(tag) + user = quote_plus(user) + if url != '': # http://del.icio.us/rss/url/efbfb246d886393d48065551434dab54 - url = DLCS_RSS + '''url/%s'''%md5.new(url).hexdigest() + url = DLCS_RSS + 'url/%s' % md5(url).hexdigest() + elif user != '' and tag != '': - url = DLCS_RSS + '''%(user)s/%(tag)s'''%dict(user=user, tag=tag) + url = DLCS_RSS + '%(user)s/%(tag)s' % {'user':user, 'tag':tag} + elif user != '' and tag == '': # http://del.icio.us/rss/delpy - url = DLCS_RSS + '''%s'''%user + url = DLCS_RSS + '%s' % user + elif popular == 0 and tag == '': url = DLCS_RSS + elif popular == 0 and tag != '': # http://del.icio.us/rss/tag/apple # http://del.icio.us/rss/tag/web2.0 - url = DLCS_RSS + "tag/%s"%tag + url = DLCS_RSS + "tag/%s" % tag + elif popular == 1 and tag == '': - url = DLCS_RSS + '''popular/''' + url = DLCS_RSS + 'popular/' + elif popular == 1 and tag != '': - url = DLCS_RSS + '''popular/%s'''%tag + url = DLCS_RSS + 'popular/%s' % tag + + if DEBUG: + print 'dlcs_rss_request', url + rss = http_request(url).read() + + # assert feedparser, "dlcs_rss_request requires feedparser to be installed." + if not feedparser: + return rss + rss = feedparser.parse(rss) - # print rss -# for e in rss.entries: print e;print - l = posts() + + posts = [] for e in rss.entries: if e.has_key("links") and e["links"]!=[] and e["links"][0].has_key("href"): url = e["links"][0]["href"] @@ -453,59 +484,147 @@ def dlcs_rss_request(tag = "", popular = 0, user = "", url = ''): # die benennung der variablen ist nicht einheitlich # api senden und # xml bekommen sind zwei verschiedene schuhe :( - l.append(post(url = url, description = description, tags = tags, dt = dt, extended = extended, user = user)) - return l + posts.append({'url':url, 'description':description, 'tags':tags, + 'dt':dt, 'extended':extended, 'user':user}) + return posts + + +delicious_v2_feeds = { + #"Bookmarks from the hotlist" + '': "%(format)s", + #"Recent bookmarks" + 'recent': "%(format)s/recent", + #"Recent bookmarks by tag" + 'tagged': "%(format)s/tag/%(tags)s", + #"Popular bookmarks" + 'popular': "%(format)s/popular", + #"Popular bookmarks by tag" + 'popular_tagged': "%(format)s/popular/%(tag)s", + #"Recent site alerts (as seen in the top-of-page alert bar on the site)" + 'alerts': "%(format)s/alerts", + #"Bookmarks for a specific user" + 'user': "%(format)s/%(username)s", + #"Bookmarks for a specific user by tag(s)" + 'user_tagged': "%(format)s/%(username)s/%(tags)s", + #"Public summary information about a user (as seen in the network badge)" + 'user_info': "%(format)s/userinfo/%(username)s", + #"A list of all public tags for a user" + 'user_tags': "%(format)s/tags/%(username)s", + #"Bookmarks from a user's subscriptions" + 'user_subscription': "%(format)s/subscriptions/%(username)s", + #"Private feed for a user's inbox bookmarks from others" + 'user_inbox': "%(format)s/inbox/%(username)s?private=%(key)s", + #"Bookmarks from members of a user's network" + 'user_network': "%(format)s/network/%(username)s", + #"Bookmarks from members of a user's network by tag" + 'user_network_tagged': "%(format)s/network/%(username)s/%(tags)s", + #"A list of a user's network members" + 'user_network_member': "%(format)s/networkmembers/%(username)s", + #"A list of a user's network fans" + 'user_network_fan': "%(format)s/networkfans/%(username)s", + #"Recent bookmarks for a URL" + 'url': "%(format)s/url/%(urlmd5)s", + #"Summary information about a URL (as seen in the tagometer)" + 'urlinfo': "json/urlinfo/%(urlmd5)s", +} + +def dlcs_feed(name_or_url, url_map=delicious_v2_feeds, count=15, **params): + + """ + Request and parse a feed. See delicious_v2_feeds for available names and + required parameters. Format defaults to json. + """ + +# http://delicious.com/help/feeds +# TODO: plain or fancy + + format = params.setdefault('format', 'json') + if count == 'all': +# TODO: fetch all + print >>sys.stderr, "! Maxcount 100 " + count = 100 + + if name_or_url in url_map: + params['count'] = count + url = DLCS_FEEDS + url_map[name_or_url] % params + + else: + url = name_or_url + + if DEBUG: + print 'dlcs_feed', url + + feed = http_request(url).read() + + if format == 'rss': + if feedparser: + rss = feedparser.parse(feed) + return rss + + else: + return feed + + elif format == 'json': + return feed ### Main module class class DeliciousAPI: - """Class providing main interace to del.icio.us API. + + """A single-user Python facade to the del.icio.us HTTP API. + + See http://delicious.com/help/api. Methods ``request`` and ``request_raw`` represent the core. For all API paths there are furthermore methods (e.g. posts_add for 'posts/all') with - an explicit declaration of the parameters and documentation. These all call - ``request`` and pass on extra keywords like ``_raw``. + an explicit declaration of parameters and documentation. """ - def __init__(self, user, passwd, codec='iso-8859-1', api_request=dlcs_api_request, xml_parser=dlcs_parse_xml): - """Initialize access to the API with ``user`` and ``passwd``. + def __init__(self, user, passwd, codec=PREFERRED_ENCODING, + api_request=dlcs_api_request, xml_parser=dlcs_parse_xml, + build_opener=dlcs_api_opener, encode_params=dlcs_encode_params): + + """Initialize access to the API for ``user`` with ``passwd``. - ``codec`` sets the encoding of the arguments. + ``codec`` sets the encoding of the arguments, which defaults to the + users preferred locale. The ``api_request`` and ``xml_parser`` parameters by default point to - functions within this package with standard implementations to + functions within this package with standard implementations which request and parse a resource. See ``dlcs_api_request()`` and - ``dlcs_parse_xml()``. Note that ``api_request`` should return a - file-like instance with an HTTPMessage instance under ``info()``, - see ``urllib2.openurl`` for more info. + ``dlcs_parse_xml()``. + + Parameter ``build_opener`` is a callable that, provided with the + credentials, should build a urllib2 opener for the delicious API server + with HTTP authentication. See ``dlcs_api_opener()`` for the default + implementation. + + ``encode_params`` finally preprocesses API parameters before + they are passed to ``api_request``. """ + assert user != "" self.user = user self.passwd = passwd self.codec = codec # Implement communication to server and parsing of respons messages: + assert callable(encode_params) + self._encode_params = encode_params + assert callable(build_opener) + self._opener = build_opener(user, passwd) assert callable(api_request) self._api_request = api_request assert callable(xml_parser) self._parse_response = xml_parser - def _call_server(self, path, **params): - params = dict0(params) - for key in params: - params[key] = params[key].encode(self.codec) - - # see __init__ for _api_request() - return self._api_request(path, params, self.user, self.passwd) - - ### Core functionality def request(self, path, _raw=False, **params): - """Calls a path in the API, parses the answer to a JSON-like structure by - default. Use with ``_raw=True`` or ``call request_raw()`` directly to - get the filehandler and process the response message manually. + """Sends a request message to `path` in the API, and parses the results + from XML. Use with ``_raw=True`` or ``call request_raw()`` directly + to get the filehandler and process the response message manually. Calls to some paths will return a `result` message, i.e.:: @@ -515,46 +634,56 @@ class DeliciousAPI: <result>...</result> - These are all parsed to ``{'result':(Boolean, MessageString)}`` and this - method will raise ``DeliciousError`` on negative `result` answers. Using - ``_raw=True`` bypasses all parsing and will never raise ``DeliciousError``. + These should all be parsed to ``{'result':(Boolean, MessageString)}``, + this method raises a ``DeliciousError`` on negative `result` answers. + Positive answers are silently accepted and nothing is returned. + + Using ``_raw=True`` bypasses all parsing and never raises + ``DeliciousError``. See ``dlcs_parse_xml()`` and ``self.request_raw()``.""" - # method _parse_response is bound in `__init__()`, `_call_server` - # uses `_api_request` also set in `__init__()` if _raw: # return answer return self.request_raw(path, **params) else: + params = self._encode_params(params, self.codec) + # get answer and parse - fl = self._call_server(path, **params) + fl = self._api_request(path, params=params, opener=self._opener) rs = self._parse_response(fl) - # Raise an error for negative 'result' answers - if type(rs) == dict and rs == 'result' and not rs['result'][0]: - errmsg = "" - if len(rs['result'])>0: - errmsg = rs['result'][1:] - raise DeliciousError, errmsg + if type(rs) == dict and 'result' in rs: + if not rs['result'][0]: + # Raise an error for negative 'result' answers + errmsg = "" + if len(rs['result'])>0: + errmsg = rs['result'][1] + DeliciousError.raiseFor(errmsg, path, **params) + + else: + # not out-of-the-oridinary result, OK + return return rs def request_raw(self, path, **params): - """Calls the path in the API, returns the filehandle. Returned - file-like instances have an ``HTTPMessage`` instance with HTTP header + """Calls the path in the API, returns the filehandle. Returned file- + like instances have an ``HTTPMessage`` instance with HTTP header information available. Use ``filehandle.info()`` or refer to the ``urllib2.openurl`` documentation. """ # see `request()` on how the response can be handled - return self._call_server(path, **params) + params = self._encode_params(params, self.codec) + return self._api_request(path, params=params, opener=self._opener) ### Explicit declarations of API paths, their parameters and docs # Tags def tags_get(self, **kwds): - """Returns a list of tags and the number of times it is used by the user. + """Returns a list of tags and the number of times it is used by the + user. :: <tags> @@ -562,14 +691,22 @@ class DeliciousAPI: """ return self.request("tags/get", **kwds) + def tags_delete(self, tag, **kwds): + """Delete an existing tag. + + &tag={TAG} + (required) Tag to delete + """ + return self.request('tags/delete', tag=tag, **kwds) + def tags_rename(self, old, new, **kwds): """Rename an existing tag with a new tag name. Returns a `result` message or raises an ``DeliciousError``. See ``self.request()``. - &old (required) - Tag to rename. - &new (required) - New name. + &old={TAG} + (required) Tag to rename. + &new={TAG} + (required) New tag name. """ return self.request("tags/rename", old=old, new=new, **kwds) @@ -590,12 +727,12 @@ class DeliciousAPI: <dates> <date date="CCYY-MM-DD" count="888"> - &tag (optional). - Filter by this tag. + &tag={TAG} + (optional) Filter by this tag """ return self.request("posts/dates", tag=tag, **kwds) - def posts_get(self, tag="", dt="", url="", **kwds): + def posts_get(self, tag="", dt="", url="", hashes=[], meta=True, **kwds): """Returns posts matching the arguments. If no date or url is given, most recent date will be used. :: @@ -603,14 +740,25 @@ class DeliciousAPI: <posts dt="CCYY-MM-DD" tag="..." user="..."> <post ...> - &tag (optional). - Filter by this tag. - &dt (optional). - Filter by this date (CCYY-MM-DDThh:mm:ssZ). - &url (optional). - Filter by this url. + &tag={TAG} {TAG} ... {TAG} + (optional) Filter by this/these tag(s). + &dt={CCYY-MM-DDThh:mm:ssZ} + (optional) Filter by this date, defaults to the most recent date on + which bookmarks were saved. + &url={URL} + (optional) Fetch a bookmark for this URL, regardless of date. + &hashes={MD5} {MD5} ... {MD5} + (optional) Fetch multiple bookmarks by one or more URL MD5s + regardless of date. + &meta=yes + (optional) Include change detection signatures on each item in a + 'meta' attribute. Clients wishing to maintain a synchronized local + store of bookmarks should retain the value of this attribute - its + value will change when any significant field of the bookmark + changes. """ - return self.request("posts/get", tag=tag, dt=dt, url=url, **kwds) + return self.request("posts/get", tag=tag, dt=dt, url=url, + hashes=hashes, meta=meta, **kwds) def posts_recent(self, tag="", count="", **kwds): """Returns a list of the most recent posts, filtered by argument. @@ -619,14 +767,15 @@ class DeliciousAPI: <posts tag="..." user="..."> <post ...> - &tag (optional). - Filter by this tag. - &count (optional). - Number of items to retrieve (Default:15, Maximum:100). + &tag={TAG} + (optional) Filter by this tag. + &count={1..100} + (optional) Number of items to retrieve (Default:15, Maximum:100). """ return self.request("posts/recent", tag=tag, count=count, **kwds) - def posts_all(self, tag="", **kwds): + def posts_all(self, tag="", start=None, results=None, fromdt=None, + todt=None, meta=True, hashes=False, **kwds): """Returns all posts. Please use sparingly. Call the `posts_update` method to see if you need to fetch this at all. :: @@ -634,13 +783,34 @@ class DeliciousAPI: <posts tag="..." user="..." update="CCYY-MM-DDThh:mm:ssZ"> <post ...> - &tag (optional). - Filter by this tag. + &tag + (optional) Filter by this tag. + &start={#} + (optional) Start returning posts this many results into the set. + &results={#} + (optional) Return this many results. + &fromdt={CCYY-MM-DDThh:mm:ssZ} + (optional) Filter for posts on this date or later + &todt={CCYY-MM-DDThh:mm:ssZ} + (optional) Filter for posts on this date or earlier + &meta=yes + (optional) Include change detection signatures on each item in a + 'meta' attribute. Clients wishing to maintain a synchronized local + store of bookmarks should retain the value of this attribute - its + value will change when any significant field of the bookmark + changes. + &hashes + (optional, exclusive) Do not fetch post details but a posts + manifest with url- and meta-hashes. Other options do not apply. """ - return self.request("posts/all", tag=tag, **kwds) + if hashes: + return self.request("posts/all", hashes=hashes, **kwds) + else: + return self.request("posts/all", tag=tag, fromdt=fromdt, todt=todt, + start=start, results=results, meta=meta, **kwds) def posts_add(self, url, description, extended="", tags="", dt="", - replace="no", shared="yes", **kwds): + replace=False, shared=True, **kwds): """Add a post to del.icio.us. Returns a `result` message or raises an ``DeliciousError``. See ``self.request()``. @@ -654,10 +824,12 @@ class DeliciousAPI: tags for the item (space delimited). &dt (optional) datestamp of the item (format "CCYY-MM-DDThh:mm:ssZ"). - - Requires a LITERAL "T" and "Z" like in ISO8601 at http://www.cl.cam.ac.uk/~mgk25/iso-time.html for example: "1984-09-01T14:21:31Z" - &replace=no (optional) - don't replace post if given url has already been posted. - &shared=no (optional) - make the item private + Requires a LITERAL "T" and "Z" like in ISO8601 at + http://www.cl.cam.ac.uk/~mgk25/iso-time.html for example: + "1984-09-01T14:21:31Z" + &replace=no (optional) - don't replace post if given url has already + been posted. + &shared=yes (optional) - wether the item is public. """ return self.request("posts/add", url=url, description=description, extended=extended, tags=tags, dt=dt, @@ -690,7 +862,7 @@ class DeliciousAPI: &bundle (required) the bundle name. &tags (required) - list of tags (space seperated). + list of tags. """ if type(tags)==list: tags = " ".join(tags) @@ -710,19 +882,22 @@ class DeliciousAPI: # Lookup table for del.icio.us url-path to DeliciousAPI method. paths = { - 'tags/get': tags_get, - 'tags/rename': tags_rename, - 'posts/update': posts_update, - 'posts/dates': posts_dates, - 'posts/get': posts_get, - 'posts/recent': posts_recent, - 'posts/all': posts_all, - 'posts/add': posts_add, - 'posts/delete': posts_delete, - 'tags/bundles/all': bundles_all, - 'tags/bundles/set': bundles_set, - 'tags/bundles/delete': bundles_delete, + 'tags/get': 'tags_get', + 'tags/delete': 'tags_delete', + 'tags/rename': 'tags_rename', + 'posts/update': 'posts_update', + 'posts/dates': 'posts_dates', + 'posts/get': 'posts_get', + 'posts/recent': 'posts_recent', + 'posts/all': 'posts_all', + 'posts/add': 'posts_add', + 'posts/delete': 'posts_delete', + 'tags/bundles/all': 'bundles_all', + 'tags/bundles/set': 'bundles_set', + 'tags/bundles/delete': 'bundles_delete', } + def get_method(self, path): + return getattr(self, self.paths[path]) def get_url(self, url): """Return the del.icio.us url at which the HTML page with posts for @@ -730,41 +905,55 @@ class DeliciousAPI: """ return "http://del.icio.us/url/?url=%s" % (url,) + def __repr__(self): + return "DeliciousAPI(%s)" % self.user + ### Convenience functions on this package def apiNew(user, passwd): - """creates a new DeliciousAPI object. - requires user(name) and passwd - """ + "Creates a new DeliciousAPI object, requires user(name) and passwd." return DeliciousAPI(user=user, passwd=passwd) -def add(user, passwd, url, description, tags="", extended="", dt="", replace="no"): - return apiNew(user, passwd).posts_add(url=url, description=description, extended=extended, tags=tags, dt=dt, replace=replace) +def add(user, passwd, url, description, tags="", extended="", dt=None, + replace=False): + apiNew(user, passwd).posts_add(url=url, description=description, + extended=extended, tags=tags, dt=dt, replace=replace) -def get(user, passwd, tag="", dt="", count = 0): - posts = apiNew(user, passwd).posts_get(tag=tag,dt=dt) - if count != 0: posts = posts[0:count] +def get(user, passwd, tag="", dt=None, count=0, hashes=[]): + "Returns a list of posts for the user" + posts = apiNew(user, passwd).posts_get( + tag=tag, dt=dt, hashes=hashes)['posts'] + if count: posts = posts[:count] return posts -def get_all(user, passwd, tag=""): - return apiNew(user, passwd).posts_all(tag=tag) +def get_update(user, passwd): + "Returns the last update time for the user." + return apiNew(user, passwd).posts_update()['update']['time'] + +def get_all(user, passwd, tag="", start=0, results=100, fromdt=None, + todt=None): + "Returns a list with all posts. Please use sparingly. See `get_updated`" + return apiNew(user, passwd).posts_all(tag=tag, start=start, + results=results, fromdt=fromdt, todt=todt, meta=True)['posts'] + +def get_tags(user, passwd): + "Returns a list with all tags for user." + return apiNew(user=user, passwd=passwd).tags_get()['tags'] def delete(user, passwd, url): - return apiNew(user, passwd).posts_delete(url=url) + "Delete the URL from the del.icio.us account." + apiNew(user, passwd).posts_delete(url=url) def rename_tag(user, passwd, oldtag, newtag): - return apiNew(user=user, passwd=passwd).tags_rename(old=oldtag, new=newtag) + "Rename the tag for the del.icio.us account." + apiNew(user=user, passwd=passwd).tags_rename(old=oldtag, new=newtag) -def get_tags(user, passwd): - return apiNew(user=user, passwd=passwd).tags_get() +### RSS functions -### RSS functions bvb: still working...? def getrss(tag="", popular=0, url='', user=""): - """get posts from del.icio.us via parsing RSS (bvb:or HTML) - - todo: not tested + """Get posts from del.icio.us via parsing RSS. tag (opt) sort by tag popular (opt) look for the popular stuff @@ -774,44 +963,83 @@ def getrss(tag="", popular=0, url='', user=""): return dlcs_rss_request(tag=tag, popular=popular, user=user, url=url) def get_userposts(user): - return getrss(user = user) + "parse RSS for user" + return getrss(user=user) def get_tagposts(tag): - return getrss(tag = tag) + "parse RSS for tag" + return getrss(tag=tag) def get_urlposts(url): - return getrss(url = url) + "parse RSS for URL" + return getrss(url=url) + +def get_popular(tag=""): + "parse RSS for popular URLS for tag" + return getrss(tag=tag, popular=1) -def get_popular(tag = ""): - return getrss(tag = tag, popular = 1) +### JSON feeds +# TODO: untested -### TODO: implement JSON fetching -def json_posts(user, count=15): - """http://del.icio.us/feeds/json/mpe - http://del.icio.us/feeds/json/mpe/art+history - count=### the number of posts you want to get (default is 15, maximum is 100) - raw a raw JSON object is returned, instead of an object named Delicious.posts +def json_posts(user, count=15, tag=None, raw=True): """ + user + count=### the number of posts you want to get (default is 15, maximum + is 100) + raw a raw JSON object is returned, instead of an object named + Delicious.posts + """ + url = "http://del.icio.us/feeds/json/" + \ + dlcs_encode_params({0:user})[0] + if tag: url += '/'+dlcs_encode_params({0:tag})[0] + + return dlcs_feed(url, count=count, raw=raw) -def json_tags(user, atleast, count, sort='alpha'): - """http://del.icio.us/feeds/json/tags/mpe - atleast=### include only tags for which there are at least ### number of posts - count=### include ### tags, counting down from the top - sort={alpha|count} construct the object with tags in alphabetic order (alpha), or by count of posts (count) - callback=NAME wrap the object definition in a function call NAME(...), thus invoking that function when the feed is executed - raw a pure JSON object is returned, instead of code that will construct an object named Delicious.tags + +def json_tags(user, atleast, count, sort='alpha', raw=True, callback=None): + """ + user + atleast=### include only tags for which there are at least ### + number of posts. + count=### include ### tags, counting down from the top. + sort={alpha|count} construct the object with tags in alphabetic order + (alpha), or by count of posts (count). + callback=NAME wrap the object definition in a function call NAME(...), + thus invoking that function when the feed is executed. + raw a pure JSON object is returned, instead of code that + will construct an object named Delicious.tags. """ + url = 'http://del.icio.us/feeds/json/tags/' + \ + dlcs_encode_params({0:user})[0] + return dlcs_feed(url, atleast=atleast, count=count, sort=sort, raw=raw, + callback=callback) -def json_network(user): - """http://del.icio.us/feeds/json/network/mpe + +def json_network(user, raw=True, callback=None): + """ callback=NAME wrap the object definition in a function call NAME(...) - ?raw a raw JSON object is returned, instead of an object named Delicious.posts + ?raw a raw JSON object is returned, instead of an object named + Delicious.posts """ + url = 'http://del.icio.us/feeds/json/network/' + \ + dlcs_encode_params({0:user})[0] + return dlcs_feed(url, raw=raw, callback=callback) -def json_fans(user): - """http://del.icio.us/feeds/json/fans/mpe + +def json_fans(user, raw=True, callback=None): + """ callback=NAME wrap the object definition in a function call NAME(...) - ?raw a pure JSON object is returned, instead of an object named Delicious. + ?raw a pure JSON object is returned, instead of an object named + Delicious. """ + url = 'http://del.icio.us/feeds/json/fans/' + \ + dlcs_encode_params({0:user})[0] + return dlcs_feed(url, raw=raw, callback=callback) + + +### delicious V2 feeds + +def getfeed(name, **params): + return dlcs_feed(name, **params) |