Source code for tributary.streaming.input.http

import aiohttp
import asyncio
import json as JSON
from .input import Foo

[docs]class HTTP(Foo): '''Connect to url and yield results Args: url (str): url to connect to interval (int): interval to re-query repeat (int): number of times to request json (bool): load http content data as json wrap (bool): wrap result in a list field (str): field to index result by proxies (list): list of URL proxies to pass to requests.get cookies (list): list of cookies to pass to requests.get ''' def __init__(self, url, interval=1, repeat=1, json=False, wrap=False, field=None, proxies=None, cookies=None): async def _req(url=url, interval=interval, repeat=repeat, json=json, wrap=wrap, field=field, proxies=proxies, cookies=cookies): count = 0 if repeat >= 0 else float('-inf') # make less than anything while count < repeat: async with aiohttp.ClientSession() as session: async with session.get(url, cookies=cookies, proxy=proxies) as response: msg = await response.text() if msg is None or response.status != 200: break if json: msg = JSON.loads(msg) if field: msg = msg[field] if wrap: msg = [msg] yield msg if interval: await asyncio.sleep(interval) if repeat >= 0: count += 1 super().__init__(foo=_req) self._name = 'Http'