diff --git a/1-Data-Cleaning.ipynb b/1-Data-Cleaning.ipynb index 2689063..24f3685 100644 --- a/1-Data-Cleaning.ipynb +++ b/1-Data-Cleaning.ipynb @@ -80,7 +80,9 @@ " '''Returns transcript data specifically from scrapsfromtheloft.com.'''\n", " page = requests.get(url).text\n", " soup = BeautifulSoup(page, \"lxml\")\n", - " text = [p.text for p in soup.find(class_=\"ast-container\").find_all('p')]\n", + " #text = [p.text for p in soup.find(class_=\"ast-container\").find_all('p')]\n", + " # page html code was modified this line of code can be formated like this\n", + " text = [p.text for p in soup.find_all('p')]\n", " print(url)\n", " return text\n", "\n",
Note: This service is not intended for secure transactions such as banking, social media, email, or purchasing. Use at your own risk. We assume no liability whatsoever for broken pages.
Alternative Proxies: