plotdevice-libs/web/__init__.py at master · plotdevice/plotdevice-libs

110 lines (90 loc) · 3.64 KB
### CREDITS ##########################################################################################
# Copyright (c) 2008 Tom De Smedt.
# See LICENSE.txt for details.
__author__    = "Tom De Smedt"
__version__   = "1.9.4.5"
__copyright__ = "Copyright (c) 2008 Tom De Smedt"
__license__   = "GPL"
# Register this library under its own module name and keep the result in _ctx.
# NOTE(review): register() lives in plotdevice.lib and is not shown here --
# presumably it returns the PlotDevice drawing context; confirm there.
from plotdevice.lib import register
_ctx = register(__name__)
### NODEBOX WEB LIBRARY #############################################################################
# The NodeBox Web library offers a collection of services to retrieve content from the internet.
# You can use the library to query Yahoo! for links, images, news and spelling suggestions,
# to read RSS and Atom newsfeeds, to retrieve articles from Wikipedia, to collect quality images
# from morgueFile, to get color themes from kuler, to browse through HTML documents, to clean up HTML,
# to validate URLs, to create GIF images from math equations using mimeTeX, and to get ironic word
# definitions from Urban Dictionary.
# The NodeBox Web library works with a caching mechanism that stores things you download from the web,
# so they can be retrieved faster the next time. Many of the services also work asynchronously.
# This means you can use the library in an animation that keeps on running while new content is downloaded
# in the background.
# The library bundles Leonard Richardson's BeautifulSoup to parse HTML,
# Mark Pilgrim's Universal Feed Parser for newsfeeds, a connection to John Forkosh's mimeTeX server,
# Leif K-Brooks' entity replace algorithm, and Bob Ippolito's simplejson.
######################################################################################################
from . import cache
from . import url
from . import html
from . import page
from . import json
# Names of the optional service submodules. Each one that can be imported is
# bound in this module's namespace under its own name (e.g. web.wikipedia);
# clear_cache() later walks the same list.
packages = [
    "yahoo", "google",
    "newsfeed",
    "wikipedia",
    "morguefile", "flickr",
    "kuler", "colr",
    "mimetex", #deprecated
    "mathtex",
    "urbandictionary",
]

import importlib

for p in packages:
    try:
        # Explicit relative import, matching the "from . import ..." lines
        # above. A plain "import <name>" is an absolute import on Python 3 and
        # could miss the submodule or pick up an unrelated top-level module of
        # the same name (e.g. "google").
        globals()[p] = importlib.import_module("." + p, __name__)
    except ImportError:
        # Best effort: a service whose module (or one of its dependencies)
        # is unavailable is simply left out.
        pass
def set_proxy(host, type="https"):
    """Forward proxy settings to url.set_proxy().

    host -- passed through unchanged; this module itself calls the function
            with None at import time (see the call right below).
    type -- passed through unchanged, defaults to "https". The parameter
            name shadows the builtin type() inside this function.
    """
    url.set_proxy(host, type)
# Runs once at import time with host=None.
# NOTE(review): presumably this means "no proxy" -- confirm in url.set_proxy().
set_proxy(None)
def is_url(url_, wait=10):
    """Check url_ by delegating to url.is_url() and return its result.

    url_ -- the address to check; the trailing underscore keeps the
            parameter from shadowing the imported url module used below.
    wait -- forwarded unchanged, defaults to 10.
            NOTE(review): presumably a timeout in seconds -- confirm in url.is_url().
    """
    return url.is_url(url_, wait)
def download(url_, wait=60, cache=None, type=".html"):
    """Fetch url_ through url.retrieve() and return the result's .data attribute.

    url_  -- the address to fetch.
    wait  -- forwarded unchanged, defaults to 60.
             NOTE(review): presumably a timeout in seconds -- confirm in url.retrieve().
    cache -- forwarded unchanged; inside this function the name shadows the
             imported cache module.
    type  -- forwarded unchanged, defaults to ".html"; shadows the builtin type().
    """
    # The third positional argument is always False here.
    # NOTE(review): presumably the "asynchronous" switch -- confirm in url.retrieve().
    response = url.retrieve(url_, wait, False, cache, type)
    return response.data
def save(url_, path="", wait=60):
    """Download url_ and write the data to disk; return the path written to.

    url_ -- an address, or any object exposing the address as a .url attribute.
    path -- target file, or a folder. When path does not end in a dot followed
            by three or four characters (".jpg", ".html"), it is treated as a
            folder and the filename parsed from the URL is appended to it.
    wait -- forwarded unchanged to download(), defaults to 60.
    """
    # Local import: os is needed for path joining but is not imported at the
    # top of this module.
    import os

    if hasattr(url_, "url"):
        url_ = url_.url
    # path[-5:-3] holds the two characters where the dot of a 3- or
    # 4-character extension would sit.
    if len(path) < 5 or "." not in path[-5:-3]:
        filename = url.parse(str(url_)).filename
        path = os.path.join(path, filename)
    data = download(url_, wait)
    # Write raw bytes in binary mode so images and other binary downloads are
    # not mangled by newline translation or text encoding; keep text mode for
    # text data. The with-block guarantees the file is flushed and closed.
    mode = "wb" if isinstance(data, bytes) else "w"
    with open(path, mode) as f:
        f.write(data)
    return path
def clear_cache():
    """Clear the page cache and the cache of every loaded service module.

    Calls page.clear_cache(), then clear_cache() on each module listed in
    `packages` that is bound in this module's namespace. Names that are not
    bound (for instance because the optional import failed) are skipped.
    """
    page.clear_cache()
    namespace = globals()
    for name in packages:
        # Look the module up directly instead of exec()-ing generated code, so
        # that only a missing module is skipped and a NameError raised inside
        # a module's own clear_cache() is no longer silently swallowed.
        module = namespace.get(name)
        if module is not None:
            module.clear_cache()
# cache.py closes files after reading and writing.
# This is necessary in Jython.
# mathTeX deprecates mimeTeX.
# Flickr accepts Unicode queries.
# Added set_proxy() command.
# Added Serafeim Zanikolas' patches & examples for Debian.
# Added Serafeim Zanikolas' html=False attribute to WikipediaPage.
# Added simplejson for improved unicode support.
# Added google.py module.
# Improvements to html.py.
# Morguefile images can be filtered by size.
# Flickr images can be filtered by size.
# Flickr images can be filtered by interestingness/relevance/date/tags.
# Fixed Flickr unicode bug.
# Wikipedia unicode improvements.
# url.URLAccumulator._done() will only load data if no URLError was raised.
# url.parse() has a new .filename attribute (equals .page).
# Handy web.save() command downloads data and saves it to a given path.
# hex_to_rgb() improvement for hex strings shorter than 6 characters.
# Upgraded to BeautifulSoup 3.0.7a
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

__init__.py

Latest commit

History

__init__.py

File metadata and controls

init.py

init.py