Open eswarketl opened 6 years ago
# Scrape the titles and IMDb ratings of the most-voted 2017 releases from the
# first IMDb search-results page and collect them in a pandas DataFrame.
from bs4 import BeautifulSoup
import pandas as pd
from requests import get

url = 'http://www.imdb.com/search/title?release_date=2017&sort=num_votes,desc&page=1'
response = get(url)

# Parallel lists: names[i] and ratings[i] describe the same movie.
names = []
ratings = []

html_soup = BeautifulSoup(response.text, 'html.parser')

# BeautifulSoup's search method is find_all(); "findall" would be looked up
# as a <findall> tag and yield None.  The CSS-class filter must be spelled
# class_ because "class" is a reserved word in Python.
movie_contains = html_soup.find_all('div', class_='lister-item mode-advanced')
print(type(movie_contains))
print(len(movie_contains))

# Sanity-check the selectors against the first result before looping.
first_movie = movie_contains[0]
first_movie_name = first_movie.h3.a.text
print(first_movie_name)
first_movie_imdb = float(first_movie.strong.text)
print(first_movie_imdb)
print()  # blank separator line (a bare `print` is a no-op in Python 3)

for contains in movie_contains:
    # Only keep entries that carry a metascore block.
    # NOTE(review): the page markup may use 'ratings-metascore' (hyphen);
    # confirm the class name against the live HTML if nothing matches.
    if contains.find('div', class_='ratings_metascore') is not None:
        names.append(contains.h3.a.text)
        ratings.append(contains.strong.text)

movie_def = pd.DataFrame({'movie': names, 'ratings': ratings})
# DataFrame.info() prints its own report and returns None, so it is called
# directly instead of being wrapped in print() (which would add "None").
movie_def.info()
print(movie_def)
Wasn't this the same code that we checked the other day?
# Debugging variant of the IMDb scraper: fetches the search-results page both
# with urllib2/urllib.request and with requests, dumps the raw responses, then
# extracts movie titles and IMDb ratings into a pandas DataFrame.
import urllib
from contextlib import closing

try:
    import urllib2  # Python 2
except ImportError:
    # Python 3 moved urlopen() into urllib.request; alias it so the call
    # site below works on either interpreter.
    import urllib.request as urllib2

from bs4 import BeautifulSoup
import pandas as pd
from requests import get

url = 'http://www.imdb.com/search/title?release_date=2017&sort=num_votes,desc&page=1'
response = get(url)

# Raw fetch for comparison with the requests-based response; closing()
# makes sure the connection is released once the body has been read.
with closing(urllib2.urlopen(url)) as raw_page:
    content = raw_page.read()

print(content)

print(response.text[:100000000])

# Parallel lists: names[i] and ratings[i] describe the same movie.
names = []
ratings = []

html_soup = BeautifulSoup(response.text, 'html.parser')

# BeautifulSoup's search method is find_all(); "findall" would be looked up
# as a <findall> tag and yield None.  The CSS-class filter must be spelled
# class_ because "class" is a reserved word in Python.
movie_contains = html_soup.find_all('div', class_='lister-item mode-advanced')
print(type(movie_contains))
print(len(movie_contains))

# Sanity-check the selectors against the first result before looping.
first_movie = movie_contains[0]
first_movie_name = first_movie.h3.a.text
print(first_movie_name)
first_movie_imdb = float(first_movie.strong.text)
print(first_movie_imdb)
print('')  # blank separator line; this spelling works on Python 2 and 3

for contains in movie_contains:
    # Only keep entries that carry a metascore block.
    # NOTE(review): the page markup may use 'ratings-metascore' (hyphen);
    # confirm the class name against the live HTML if nothing matches.
    if contains.find('div', class_='ratings_metascore') is not None:
        names.append(contains.h3.a.text)
        ratings.append(contains.strong.text)

movie_def = pd.DataFrame({'movie': names, 'ratings': ratings})
# DataFrame.info() prints its own report and returns None, so it is called
# directly instead of being wrapped in print() (which would add "None").
movie_def.info()
print(movie_def)