Инструменты пользователя

Инструменты сайта


python:parsers:proxy

Это старая версия документа!


proxy

import requests
from bs4 import BeautifulSoup
from random import choice
 
 
def get_proxy():
    """Scrape free-proxy-list.net and return one randomly chosen proxy.

    Only rows 1..12 of the table with id ``proxylisttable`` are considered
    (row 0 is skipped, presumably because it is the header row).

    Returns:
        dict: ``{'schema': 'http' or 'https', 'address': 'ip:port'}``.

    Raises:
        requests.RequestException: the listing page could not be fetched
            (connection failure, timeout, or an HTTP error status).
        RuntimeError: the expected table is not on the page, or no row
            could be parsed into a proxy.
    """
    # Without a timeout requests may block indefinitely on a stalled server.
    response = requests.get('https://free-proxy-list.net/', timeout=5)
    # Fail here on 4xx/5xx instead of trying to parse an error page.
    response.raise_for_status()
    soup = BeautifulSoup(response.text, 'lxml')

    table = soup.find('table', id='proxylisttable')
    if table is None:
        # find() returns None when the page layout changes; report that
        # clearly rather than crashing with AttributeError on None.
        raise RuntimeError(
            "proxy table 'proxylisttable' not found on free-proxy-list.net"
        )

    proxies = []
    for tr in table.find_all('tr')[1:13]:
        tds = tr.find_all('td')
        if len(tds) < 7:
            # Malformed or filler row: cells 0, 1 and 6 are required below.
            continue
        ip = tds[0].text.strip()
        port = tds[1].text.strip()
        # Cell 6 containing 'yes' marks the proxy as https-capable
        # (presumably the site's "Https" column - verify against the page).
        schema = 'https' if 'yes' in tds[6].text.strip() else 'http'
        proxies.append({'schema': schema, 'address': ip + ':' + port})

    print(proxies)
    if not proxies:
        # random.choice() on an empty list raises a bare IndexError.
        raise RuntimeError('no proxies could be parsed from free-proxy-list.net')
    return choice(proxies)
 
 
def get_html(url):
    """Fetch *url* through a randomly chosen free proxy and return its body.

    Args:
        url: Address to request; may be an ``http://`` or ``https://`` URL.

    Returns:
        str: The decoded response body (``Response.text``).

    Raises:
        requests.RequestException: the proxy or the target could not be
            reached within the 5 second timeout.
        Any exception raised by ``get_proxy()``.
    """
    p = get_proxy()  # {'schema': 'http' or 'https', 'address': 'ip:port'}

    # requests chooses a proxy by the scheme of the *target* URL. Keying the
    # mapping only on p['schema'] meant an 'https' proxy was silently skipped
    # for an http:// URL, so the request left from the caller's own IP.
    # Register the proxy for both schemes so it is always used; a proxy that
    # cannot tunnel https then fails loudly instead of being bypassed.
    # The explicit 'http://' prefix follows the requests docs, which require
    # proxy URLs to include a scheme.
    proxy_url = 'http://' + p['address']
    proxy = {'http': proxy_url, 'https': proxy_url}

    r = requests.get(url, proxies=proxy, timeout=5)
    return r.text
 
 
def main():
    """Print the IP address that httpbin.org reports for a proxied request."""
    target = 'http://httpbin.org/ip'
    body = get_html(target)
    print('Вы зашли с ip: ' + body)


# Run the demo only when executed as a script, not when imported.
if __name__ == "__main__":
    main()
python/parsers/proxy.1585502549.txt.gz · Последние изменения: 2023/01/12 12:16 (внешнее изменение)