|
import os |
|
from selenium import webdriver |
|
from selenium.webdriver.common.by import By |
|
from selenium.webdriver.common.keys import Keys |
|
from selenium.webdriver.support.ui import WebDriverWait |
|
from selenium.webdriver.support import expected_conditions as EC |
|
from selenium.webdriver.chrome.options import Options |
|
from selenium.webdriver.chrome.service import Service |
|
import requests |
|
import time |
|
|
|
count=4 |
|
|
|
def openDataset(user_prompt): |
|
chrome_options = Options() |
|
chrome_options.add_argument("--headless") |
|
driver = webdriver.Chrome(options=chrome_options) |
|
try: |
|
driver.get('https://www.openml.org/search?type=data&status=active') |
|
|
|
time.sleep(5) |
|
|
|
search = WebDriverWait(driver, 20).until( |
|
EC.presence_of_element_located((By.CSS_SELECTOR, "input.MuiInputBase-input.css-mnn31"))) |
|
search.send_keys(user_prompt) |
|
search.send_keys(Keys.RETURN) |
|
time.sleep(4) |
|
|
|
divs = driver.find_elements(By.CSS_SELECTOR, "div.MuiPaper-root.MuiPaper-elevation.MuiPaper-elevation1.MuiCard-root.sc-gFAWRd.gJoEXx.css-1xol7fw") |
|
a=0 |
|
urls=[] |
|
for div in divs: |
|
a+=1 |
|
if a>count: |
|
break |
|
div.click() |
|
urls.append(driver.current_url) |
|
|
|
driver.back() |
|
time.sleep(2) |
|
|
|
driver.quit() |
|
return urls |
|
except: |
|
print("Internet Issue driver crashed") |
|
return [] |
|
|
|
|
|
|