2
2
import httpx
3
3
import bs4
4
4
import datetime
5
import asyncio

# Module-level event loop used by main() to drive the async scraper.
# asyncio.get_event_loop() is deprecated when there is no running loop
# (Python 3.10+), so create one explicitly and install it as the current
# loop for this thread.
loop = asyncio.new_event_loop()
asyncio.set_event_loop(loop)
5
8
6
9
7
10
def main():
    """Entry point: run the concurrent title scrape and report elapsed time."""
    print("Python async web scraper")

    t0 = datetime.datetime.now()
    try:
        # Drive the async scraper to completion on the module-level loop.
        loop.run_until_complete(get_titles())

        dt = datetime.datetime.now() - t0
        print(f"Finished in {dt.total_seconds():,.2f} seconds.")
    finally:
        # Close the loop even if scraping raised, so its resources are
        # released (the original closed it only on the success path).
        loop.close()
19
+
15
20
16
async def get_html(n: int) -> str:
    """Download and return the HTML text for talkpython.fm episode *n*."""
    print(Fore.YELLOW + f"Getting HTML for episode {n} ...", flush=True)

    url = f'https://talkpython.fm/{n}'

    # A short-lived client per request; "async with" guarantees every
    # connection it opened is closed on exit, error or not.
    async with httpx.AsyncClient() as client:
        response = await client.get(url)
        response.raise_for_status()

    return response.text
24
31
@@ -34,10 +41,24 @@ def get_title_from_html(n: int, html: str) -> str:
34
41
return header .text .strip ()
35
42
36
43
37
async def get_titles():
    """Fetch episodes 220-230 concurrently and print each title in order.

    Every download is started up front so the HTTP requests overlap; the
    results are then awaited in episode order so the output stays
    deterministic regardless of completion order.
    """
    episodes = range(220, 231)

    # asyncio.create_task schedules on the currently running loop, so this
    # coroutine no longer depends on the module-level `loop` global and works
    # under run_until_complete() and asyncio.run() alike.
    tasks = [(n, asyncio.create_task(get_html(n))) for n in episodes]

    for episode, task in tasks:
        html = await task
        title = get_title_from_html(episode, html)
        print(Fore.GREEN + title)
42
63
43
64
0 commit comments