# Download a text resource over HTTP and print its contents.
import urllib.request

# Location of the resource to fetch.
link = 'http://www.cs.virginia.edu/~cs1112/datasets/words/most-misspelled'

# Open the connection inside a `with` block so the response is closed
# as soon as the body has been read, even if read() raises.
with urllib.request.urlopen(link) as stream:
    page = stream.read()  # raw response body as bytes

# Decode the bytes as UTF-8; raises UnicodeDecodeError on invalid input.
text = page.decode('UTF-8')

print(text)