Created
March 18, 2024 13:20
-
-
Save dylanholmes/d6fc4b3ecd6182dcb2852e352434fa94 to your computer and use it in GitHub Desktop.
Scrape a web page whose content fits within the prompt context length
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
"""Ask a Griptape agent to scrape a web page and list the job postings on it.

The agent is given a single ``WebScraper`` tool whose loader uses
``MarkdownifyWebScraperDriver``.  The tool is created with
``off_prompt=False``.
NOTE(review): presumably this returns the scraped page content directly to
the prompt, so the approach only suits pages small enough for the model's
context window -- confirm against the Griptape docs for the installed version.
"""

from dotenv import load_dotenv
from griptape.drivers import MarkdownifyWebScraperDriver
from griptape.loaders import WebLoader
from griptape.structures import Agent
from griptape.tools import WebScraper

load_dotenv()  # take environment variables from .env.

url = "https://www.google.com/about/careers/applications/jobs/results#!t=jo&jid=127025001&"

agent = Agent(
    tools=[
        WebScraper(
            web_loader=WebLoader(
                web_scraper_driver=MarkdownifyWebScraperDriver(),
            ),
            # NOTE(review): presumably keeps the tool output in the prompt
            # rather than off-prompt storage -- confirm.
            off_prompt=False,
        )
    ]
)

agent.run(f"Find all the job listings at {url}")

# Output:
# ```md
# Here are some of the job listings at Google:
#
# 1. Staff Software Engineer, Machine Learning, Core - New York, NY, USA; Sunnyvale, CA, USA; +4 more; +3 more
# 2. Security Engineering Manager, Product Security Engineering, Cloud CISO - Málaga, Spain
# 3. Staff Product Design Engineer, Tablets - Mountain View, CA, USA
# 4. New Business Account Strategist, Onboarding, Google Customer Solutions - New York, NY, USA
# 5. Cloud Customer Engineer, AI/ML - Cambridge, MA, USA; New York, NY, USA
# 6. Program Manager III, Supply Chain, Cloud Capacity Planning - Sunnyvale, CA, USA; Atlanta, GA, USA; +3 more; +2 more
# 7. Product Manager, Data Analytics and Business Intelligence - Hyderabad, Telangana, India
# 8. Lead CPU and Performance Architect - Austin, TX, USA; Mountain View, CA, USA; +2 more; +1 more
# 9. Head of Private Platforms and Anti-Covert Tracking, Privacy Sandbox - Mountain View, CA, USA; Atlanta, GA, USA; +11 more; +10 more
# 10. Director, Data Center Network Delivery - Sunnyvale, CA, USA
#
# Please note that this is just a selection of the jobs available. There are many more listed on the website.
# ```
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment