# Example 1: print the URLs returned by a Google search for a fixed query.
#
# Install the dependencies from a shell first (these are shell commands,
# not Python statements):
#   pip install beautifulsoup4
#   pip install google
from googlesearch import search

query = "what is a computer"

# NOTE(review): per the library's docs, `num` is the number of results per
# page and `stop` is the last result to retrieve -- confirm for the
# installed version.
for result in search(query, num=20, stop=10):
    print(result)
# Example 2: the same kind of search with an explicit TLD and a pause
# between requests.
try:
    from googlesearch import search
except ImportError:
    print("No module named 'google' found")
    # Without `search` the loop below cannot run; stop here instead of
    # failing a few lines later with a NameError.
    raise SystemExit(1)

# to search
query = "Geeksforgeeks"

# NOTE(review): tld="co.in" presumably selects the google.co.in domain and
# pause=2 the delay in seconds between HTTP requests -- confirm against the
# library's documentation.
for j in search(query, tld="co.in", num=10, stop=10, pause=2):
    print(j)
// Example 3: launch a headless browser, abort requests for images,
// stylesheets and fonts, load a page and print its title.
//
// NOTE(review): `chromium` is not defined in this snippet. It presumably comes
// from Playwright (e.g. `const { chromium } = require("playwright");`) --
// confirm and bring it into scope before running.
// The `(async () => {` opener was lost in the paste; it is restored here to
// match the closing `})();` and the use of `await` in the body.
(async () => {
  // Launching a new browser instance
  const browser = await chromium.launch({
    headless: true
  });

  // try/finally so the browser is closed even if navigation or scraping throws.
  try {
    // Opening a new page
    const page = await browser.newPage();

    // Block unnecessary resources (images, stylesheets, fonts)
    const blockedExtensions = [
      ".png", ".jpg", ".jpeg", ".gif",
      ".css", ".woff", ".woff2", ".ttf"
    ];
    await page.route("**/*", route => {
      const url = route.request().url();

      // Return the promise so a failure in abort/continue is not silently dropped.
      if (blockedExtensions.some(ext => url.endsWith(ext))) {
        return route.abort();
      }
      return route.continue();
    });

    // Navigate to the target URL
    await page.goto("https://browserless.io/");
    console.log("Page loaded");

    // Perform any scraping tasks
    const data = await page.evaluate(() => {
      return document.title;
    });

    console.log(`Page title: ${data}`);

    // Closing the page
    await page.close();

    console.log("Page closed");
  } finally {
    // Closing the browser instance
    await browser.close();

    console.log("Browser closed");
  }
})();