import numpy as np
import pandas as pd
# Sample frame mixing missing values with strings that contain stray
# letters and punctuation around the digits we want to keep.
rows = [
    [np.nan, 'f+2', np.nan, '0'],
    ['3', '4', np.nan, 'y1,et'],
    [np.nan, np.nan, np.nan, np.nan],
    [np.nan, '3', np.nan, 'w$4q'],
]
df = pd.DataFrame(rows, columns=list("ABCD"))
print(df)

# Remove every ASCII letter and the characters "+", "$", "," from the
# string cells; NaN cells are left as they are.
df = df.replace(to_replace=r'[a-zA-Z+$,]', value='', regex=True)
print(df)

# Missing cells become 0.0, then the whole frame is converted to float.
df = df.fillna(0.0).astype(float)
print(df)
A B C D
0 NaN f+2 NaN 0
1 3 4 NaN y1,et
2 NaN NaN NaN NaN
3 NaN 3 NaN w$4q
A B C D
0 NaN 2 NaN 0
1 3 4 NaN 1
2 NaN NaN NaN NaN
3 NaN 3 NaN 4
A B C D
0 0.0 2.0 0.0 0.0
1 3.0 4.0 0.0 1.0
2 0.0 0.0 0.0 0.0
3 0.0 3.0 0.0 4.0
Как запустить код на библиотеке selenium_stealth без монитора?
#!/usr/bin/env python
# -*- coding: utf-8 -*-
from selenium import webdriver
from selenium_stealth import stealth
import time
# Configure Chrome: headless mode (no display needed) plus the switches
# that hide the usual automation markers.
options = webdriver.ChromeOptions()
options.add_argument("start-maximized")
options.add_argument("--headless")
options.add_experimental_option("excludeSwitches", ["enable-automation"])
options.add_experimental_option('useAutomationExtension', False)

driver = webdriver.Chrome(options=options)
try:
    # Apply the selenium_stealth overrides with the fingerprint values below.
    stealth(
        driver,
        languages=["en-US", "en"],
        vendor="Google Inc.",
        platform="Win32",
        webgl_vendor="Intel Inc.",
        renderer="Intel Iris OpenGL Engine",
        fix_hairline=True,
    )
    url = "https://bot.sannysoft.com/"
    driver.get(url)
    # Give the page a few seconds to finish running its checks.
    time.sleep(5)
finally:
    # Always shut the browser down, even if stealth() or get() raised,
    # so no orphaned Chrome/chromedriver processes are left behind.
    driver.quit()
$ chromedriver --version
ChromeDriver 99.0.4844.51 (d537ec02474b5afe23684e7963d538896c63ac77-refs/branch-heads/4844@{#875})
$ google-chrome-stable --version
Google Chrome 99.0.4844.51
#!/usr/bin/env bash
# For every *.mp4 found under $DIR: copy it into /config/rec/<name>/ and
# upload that directory with rclone. NUL-delimited reading keeps file
# names with spaces or newlines intact.
while IFS= read -r -d '' file; do
    # Strip the directory part, then only the LAST extension, so names
    # that contain dots (e.g. "2022.03.10.mp4") keep their full stem
    # instead of being cut at the first dot.
    file_name=$(basename "$file")
    file_name=${file_name%.*}
    target_dir="/config/rec/$file_name"
    mkdir -p "$target_dir"
    cp "$file" "$target_dir"
    rclone copy "$target_dir" cloud: --max-age 12h --create-empty-src-dirs -P --transfers=1 --checkers=1
done < <(find "$DIR" -name "*.mp4" -print0)
Я не пользуюсь rclone, так что эту часть проверьте сами.
import time
from selenium import webdriver
from selenium.webdriver.chrome.options import Options
from bs4 import BeautifulSoup
# Run Chrome headless. The command-line flag is used instead of the
# deprecated `Options.headless` setter.
options = Options()
options.add_argument("--headless")
driver = webdriver.Chrome(options=options)

URL = 'https://eth.nanopool.org/'
try:
    driver.get(URL)
    # Wait BEFORE reading the page source so that content rendered by
    # scripts after the initial load is included in the captured HTML.
    time.sleep(5)
    html = driver.page_source
finally:
    # Release the browser whether or not loading succeeded.
    driver.quit()

soup = BeautifulSoup(html, 'lxml')
data = soup.find_all('div', class_='panel panel-primary fixed-height-panel')
# Print "<title>: <value>" for each matched panel.
for elem in data:
    elem_title = elem.find('div', class_='panel-title').text
    elem_value = elem.find('div', class_='panel-body').text
    print(f'{elem_title}: {elem_value}')
Result: near "BETWEEN": syntax error
from bs4 import BeautifulSoup
# Sample markup: three <div> blocks, each holding a <p> with a numeric
# class and a <label>; only labels next to class "1" are wanted.
DOC = '''
<html>
<body>
<div>
<p class="1">
<label>Значение, которое нужно спарсить</label>
</div>
<div>
<p class="2">
<label>Значение, которое мне не нужно</label>
</div>
<div>
<p class="1">
<label>Ещё одно значение, которое нужно спарсить</label>
</div>
</body>
</html>
'''
soup = BeautifulSoup(DOC, 'lxml')
wanted_paragraphs = soup.find_all('p', class_='1')
for paragraph in wanted_paragraphs:
    # Climb to the enclosing <div>, then take the first <label> inside it.
    container = paragraph.find_parent('div')
    print(container.find('label').text)