Origin: loosely based on upstream commit 68db2d26ddb5f95de4254d61b850d3dcaf6ce717
Author: patrick "phofl", Rebecca N. Palmer <rebecca_palmer@zoho.com>
Bug: https://github.com/pandas-dev/pandas/issues/38988
Bug-Debian: https://bugs.debian.org/979621
Forwarded: no
Gbp-Pq: Name 979621_dead_url.patch
.. ipython:: python
- url = 'https://www.fdic.gov/bank/individual/failed/banklist.html'
+ url = 'https://raw.githubusercontent.com/pandas-dev/pandas/master/pandas/tests/io/data/html/banklist.html'
dfs = pd.read_html(url)
dfs
-.. note::
-
- The data from the above URL changes every Monday so the resulting data above
- and the data below may be slightly different.
Read in the content of the file from the above URL and pass it to ``read_html``
as a string:
@tm.network
def test_banklist_url_positional_match(self):
- url = "http://www.fdic.gov/bank/individual/failed/banklist.html"
+ url = "https://raw.githubusercontent.com/pandas-dev/pandas/master/pandas/tests/io/data/html/banklist.html"
# Passing match argument as positional should cause a FutureWarning.
with tm.assert_produces_warning(FutureWarning):
df1 = self.read_html(
@tm.network
def test_banklist_url(self):
- url = "http://www.fdic.gov/bank/individual/failed/banklist.html"
+ url = "https://raw.githubusercontent.com/pandas-dev/pandas/master/pandas/tests/io/data/html/banklist.html"
df1 = self.read_html(
url, match="First Federal Bank of Florida", attrs={"id": "table"}
)