10BC0 TST: win32 paths cannot be turned into URLs by prefixing them with "file://" by mindw · Pull Request #4580 · pandas-dev/pandas · GitHub
[go: up one dir, main page]

Skip to content
Closed
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

10BC0 Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Next Next commit
win32 paths cannot be turned into URLs by prefixing them with "file://"
  • Loading branch information
mindw committed Aug 16, 2013
commit d64a0476c0d39ce173da97ffd4417484a413bf29
12 changes: 9 additions & 3 deletions pandas/io/tests/test_html.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,6 +27,12 @@
from pandas.util.testing import makeCustomDataframe as mkdf


import urlparse, urllib
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

can you put this in pandas/io/common.py ?


def path2url(path):
    """Convert a local filesystem path to a ``file://`` URL.

    Naively prefixing ``'file://'`` breaks on win32 paths such as
    ``C:\\foo\\bar`` (drive letter, backslash separators);
    ``pathname2url`` percent-encodes and converts separators in a
    platform-aware way, and ``urljoin`` attaches the scheme.

    Parameters
    ----------
    path : str
        Absolute path to a local file.

    Returns
    -------
    str
        A ``file:`` URL suitable for ``urlopen``.
    """
    # Local imports keep the function working on both Python 3
    # (urllib.parse / urllib.request) and legacy Python 2
    # (urlparse / urllib) without touching module-level imports.
    try:
        from urllib.parse import urljoin
        from urllib.request import pathname2url
    except ImportError:  # Python 2 fallback
        from urlparse import urljoin
        from urllib import pathname2url
    return urljoin('file:', pathname2url(path))
Copy link
Contributor

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

this you can take out


def _have_module(module_name):
try:
import_module(module_name)
Expand Down Expand Up @@ -292,7 +298,7 @@ def test_bad_url_protocol(self):
@slow
def test_file_url(self):
url = self.banklist_data
dfs = self.run_read_html('file://' + url, 'First',
dfs = self.run_read_html(path2url(url), 'First',
attrs={'id': 'table'})
self.assertIsInstance(dfs, list)
for df in dfs:
Expand Down Expand Up @@ -338,7 +344,7 @@ def test_multiindex_header_index_skiprows(self):
@slow
def test_regex_idempotency(self):
url = self.banklist_data
dfs = self.run_read_html('file://' + url,
dfs = self.run_read_html(path2url(url),
match=re.compile(re.compile('Florida')),
attrs={'id': 'table'})
self.assertIsInstance(dfs, list)
Expand Down Expand Up @@ -464,7 +470,7 @@ def test_invalid_flavor():

def get_elements_from_url(url, element='table', base_url="file://"):
_skip_if_none_of(('bs4', 'html5lib'))
url = "".join([base_url, url])
url = path2url(url) if base_url == "file://" else "".join([base_url, url])
from bs4 import BeautifulSoup
with urlopen(url) as f:
soup = BeautifulSoup(f, features='html5lib')
Expand Down
0