6 lat temu · eb104453c2
--- a/05_Page_views_eda.ipynb
+++ b/05_Page_views_eda.ipynb
--- a/solutions/page_view_eda.py
+++ b/solutions/page_view_eda.py
@@ -0,0 +1,17 @@
 
				+import operator
			
 
				+import urllib.parse
			
 
				+import pandas
			
 
				+
			
 
				+
			
 
				+page_views = pandas.read_parquet(PAGE_VIEWS_FNAME)
			
 
				+page_views.index = (page_views.index
			
 
				+                              .to_series()
			
 
				+                              .apply(urllib.parse.urlparse)
			
 
				+                              .apply(operator.attrgetter('path'))
			
 
				+                              .str.split('/')
			
 
				+                              .str[-1]
			
 
				+                              .str.rstrip('.html'))
			
 
				+
			
 
				+
			
 
				+docstring_errors = (pandas.read_hdf(DOCSTRING_ERRORS_FNAME)
			
 
				+                          .join(page_views.groupby('Page')['Pageviews'].sum()))