summaryrefslogtreecommitdiff
path: root/plugin/readability/url_helpers.py
diff options
context:
space:
mode:
Diffstat (limited to 'plugin/readability/url_helpers.py')
-rwxr-xr-xplugin/readability/url_helpers.py52
1 files changed, 0 insertions, 52 deletions
diff --git a/plugin/readability/url_helpers.py b/plugin/readability/url_helpers.py
deleted file mode 100755
index 8234c8d..0000000
--- a/plugin/readability/url_helpers.py
+++ /dev/null
@@ -1,52 +0,0 @@
-import logging
-from urlparse import urlparse
-
-def host_for_url(url):
- """
- >>> host_for_url('http://base/whatever/fdsh')
- 'base'
- >>> host_for_url('invalid')
- """
- host = urlparse(url)[1]
- if not host:
- logging.error("could not extract host from URL: %r" % (url,))
- return None
- return host
-
-def absolute_url(url, base_href):
- """
- >>> absolute_url('foo', 'http://base/whatever/ooo/fdsh')
- 'http://base/whatever/ooo/foo'
-
- >>> absolute_url('foo/bar/', 'http://base')
- 'http://base/foo/bar/'
-
- >>> absolute_url('/foo/bar', 'http://base/whatever/fdskf')
- 'http://base/foo/bar'
-
- >>> absolute_url('\\n/foo/bar', 'http://base/whatever/fdskf')
- 'http://base/foo/bar'
-
- >>> absolute_url('http://localhost/foo', 'http://base/whatever/fdskf')
- 'http://localhost/foo'
- """
- url = url.strip()
- proto = urlparse(url)[0]
- if proto:
- return url
-
- base_url_parts = urlparse(base_href)
- base_server = '://'.join(base_url_parts[:2])
- if url.startswith('/'):
- return base_server + url
- else:
- path = base_url_parts[2]
- if '/' in path:
- path = path.rsplit('/', 1)[0] + '/'
- else:
- path = '/'
- return base_server + path + url
-
-if __name__ == '__main__':
- import doctest
- doctest.testmod() \ No newline at end of file