diff --git a/README.md b/README.md index d8f76f90..eb0a6308 100644 --- a/README.md +++ b/README.md @@ -108,7 +108,7 @@ class NullAgentRunner(AgentRunner): - `--headless`: Run with Playwright headless mode - `-id` or `--id`: Run a specific test by id - `-i` or `--intent`: Only run tests of a particular intent (fetch, links, etc) -- `-d` or `--domain`: Only run tests of a particular domain (healthcare, manufacturing, software, etc) +- `-c` or `--category`: Only run tests of a particular category (healthcare, manufacturing, software, etc) - `-n` or `--n`: Number of test workers to use. The default is 1 - `-skip` or `--skip`: A list of ids to skip tests on, separated by commas - `-t` or `--type`: Only run tests of a particular type (links, fetch, etc) diff --git a/bananalyzer/__main__.py b/bananalyzer/__main__.py index 7db02627..0c804592 100644 --- a/bananalyzer/__main__.py +++ b/bananalyzer/__main__.py @@ -8,6 +8,7 @@ import sys from pathlib import Path from typing import List +from urllib.parse import urlparse from bananalyzer import AgentRunner from bananalyzer.data.examples import ( @@ -66,6 +67,13 @@ def parse_args() -> Args: default=None, help="Filter tests by id", ) + parser.add_argument( + "-d", + "--domain", + type=str, + default=None, + help="Filter tests by a particular URL domain", + ) parser.add_argument( "-i", "--intent", @@ -74,17 +82,17 @@ def parse_args() -> Args: help="Filter tests by a particular intent", ) parser.add_argument( - "-d", - "--domain", + "-c", + "--category", type=str, default=None, - help="Filter tests by a particular domain", + help="Filter tests by a particular category", ) parser.add_argument( - "--subdomain", + "--subcategory", type=str, default=None, - help="Filter tests by a particular domain", + help="Filter tests by a particular category", ) parser.add_argument( "-n", @@ -142,7 +150,8 @@ def parse_args() -> Args: intent=args.intent, id=args.id, domain=args.domain, - subdomain=args.subdomain, + category=args.category, + 
subcategory=args.subcategory, skip=args.skip, single_browser_instance=args.single_browser_instance, type=args.type, @@ -243,7 +252,15 @@ def main() -> int: ] if args.domain: filtered_examples = [ - example for example in filtered_examples if example.domain == args.domain + example + for example in filtered_examples + if ".".join(urlparse(example.url).netloc.split(".")[-2:]) == args.domain + ] + if args.category: + filtered_examples = [ + example + for example in filtered_examples + if example.category == args.category ] if args.skip: filtered_examples = [ @@ -253,11 +270,11 @@ def main() -> int: filtered_examples = [ example for example in filtered_examples if example.type in args.type ] - if args.subdomain: + if args.subcategory: filtered_examples = [ example for example in filtered_examples - if example.subdomain in args.subdomain + if example.subcategory in args.subcategory ] # Test we actually have tests to run diff --git a/bananalyzer/data/schemas.py b/bananalyzer/data/schemas.py index 0db848db..c30c158a 100644 --- a/bananalyzer/data/schemas.py +++ b/bananalyzer/data/schemas.py @@ -59,8 +59,8 @@ class Example(BaseModel): source: Literal["mhtml", "hosted", "url"] = Field( description="Source of the website" ) - domain: str = Field(description="Domain of the website") - subdomain: str = Field(description="Subdomain of the website") + category: str = Field(description="Category of the website") + subcategory: str = Field(description="Subcategory of the website") type: GoalType = Field( description="The high level goal intent the agent is aiming to do" ) diff --git a/bananalyzer/schema.py b/bananalyzer/schema.py index 514fae86..89883040 100644 --- a/bananalyzer/schema.py +++ b/bananalyzer/schema.py @@ -16,9 +16,10 @@ class Args(BaseModel): headless: bool single_browser_instance: bool id: Optional[str] = Field(default=None) - intent: Optional[GoalType] = Field(default=None) domain: Optional[str] = Field(default=None) - subdomain: Optional[str] = Field(default=None) 
+ intent: Optional[GoalType] = Field(default=None) + category: Optional[str] = Field(default=None) + subcategory: Optional[str] = Field(default=None) skip: List[str] type: Optional[str] = Field(default=None) download: bool diff --git a/fetch.ipynb b/fetch.ipynb index 8ec92dbd..8c8741f1 100644 --- a/fetch.ipynb +++ b/fetch.ipynb @@ -99,8 +99,8 @@ "# \"id\": str(uuid.uuid4()),\n", "# \"url\": desired_url,\n", "# \"source\": \"mhtml\",\n", - "# \"domain\": \"UPDATE\",\n", - "# \"subdomain\": \"UPDATE\",\n", + "# \"category\": \"UPDATE\",\n", + "# \"subcategory\": \"UPDATE\",\n", "# \"type\": \"fetch\",\n", "# \"goal\": {},\n", "# \"evals\": [\n", @@ -114,8 +114,8 @@ " \"id\": str(uuid.uuid4()),\n", " \"url\": desired_url,\n", " \"source\": \"mhtml\",\n", - " \"domain\": \"healthcare\",\n", - " \"subdomain\": \"contact\",\n", + " \"category\": \"healthcare\",\n", + " \"subcategory\": \"contact\",\n", " \"type\": \"links\",\n", " \"goal\": \"Fetch all of the links to the detail pages of clinics on the current page\",\n", " \"evals\": [{\"type\": \"json_match\", \"expected\": {}}],\n", diff --git a/pyproject.toml b/pyproject.toml index 03061063..914e1b1f 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [tool.poetry] name = "bananalyzer" -version = "0.6.10" +version = "0.6.11" description = "Open source AI Agent evaluation framework for web tasks 🐒🍌" authors = ["asim-shrestha "] diff --git a/static/examples.json b/static/examples.json index 17ca2728..01619758 100644 --- a/static/examples.json +++ b/static/examples.json @@ -3,8 +3,8 @@ "id": "c5e7ec4b-ad83-49a5-b056-a37ddf974a64", "url": "https://www.mindstix.com/careers/machine-learning.html", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -30,8 +30,8 @@ "id": "8366209e-e5fb-4f64-85e0-79cd90985b59", "url": 
"https://www.amazon.jobs/en/jobs/2482000/software-development-engineer-amazon-access", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -57,8 +57,8 @@ "id": "6152ba56-e62b-42d1-beec-6ecac1dfec35", "url": "https://openai.com/careers/software-engineer-fullstack", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -84,8 +84,8 @@ "id": "d86e052f-3c14-4b4d-95e7-c26d59b771f7", "url": "https://www.metacareers.com/jobs/271783205502889/", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -111,8 +111,8 @@ "id": "4310caaa-bf1b-4704-9362-dbf5b961972d", "url": "https://c3.ai/job-description/?gh_jid=6181786002", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -138,8 +138,8 @@ "id": "ad142573-4dcb-4c1e-9a4d-6fa1fa818026", "url": "https://jobs.careers.microsoft.com/global/en/job/1658879/Software-Engineering-II", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -165,8 +165,8 @@ "id": "69a755f1-33db-4f77-9b8e-0e90cf7c7188", "url": "https://vercel.com/careers/technical-consultant-us-4930025004", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -192,8 +192,8 @@ "id": "f8e6ac9d-584d-4321-9451-7ebe0af3b6cb", "url": "https://www.ycombinator.com/careers?ashby_jid=05682b47-a5e2-4003-a9b8-b967cf45dd48", "source": 
"mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -219,8 +219,8 @@ "id": "766abf53-e055-4e4d-ac42-531e74606846", "url": "https://jobs.lever.co/Anthropic/2786d360-13e0-4ad2-bef1-a193cd6a1f67", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -246,8 +246,8 @@ "id": "9a10af79-08e2-4d73-a2a1-675bb97126bb", "url": "https://boards.greenhouse.io/reddit/jobs/5245144", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -273,8 +273,8 @@ "id": "77d6efb9-2581-4f5f-a681-1b94696d9044", "url": "https://ouryahoo.wd5.myworkdayjobs.com/careers/job/Taiwan---Remote/Backend-Engineer--Media_JR0023180", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -300,8 +300,8 @@ "id": "5db440aa-f155-4297-bae4-769c8c808acd", "url": "https://jobs.apple.com/en-us/details/200517170/engineering-manager-camera-foundation?team=SFTWR", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -327,8 +327,8 @@ "id": "cc29229c-30f6-4a03-a4b6-2755ed0cca14", "url": "https://www.workatastartup.com/jobs/62396?utm_campaign=google_jobs_apply&utm_source=google_jobs_apply&utm_medium=organic", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -354,8 +354,8 @@ "id": "6535b75f-be1e-4f68-aedd-f3ff167d98ca", "url": 
"https://stripe.com/jobs/listing/account-executive-commercial/5403149", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -381,8 +381,8 @@ "id": "0880ea91-7c5e-415c-9d2f-00457f110ee8", "url": "https://careers.doordash.com/jobs/5462166", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -408,8 +408,8 @@ "id": "a266e560-aa88-49fe-b3c0-2731163b1921", "url": "https://jobs.netflix.com/jobs/301592752", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -435,8 +435,8 @@ "id": "db0872df-fd27-4fff-bce8-3513f8e1164d", "url": "https://scale.com/careers/4314568005", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -462,8 +462,8 @@ "id": "574db794-8055-4fe6-bd16-5f9ee6eccbb4", "url": "https://bb.wd3.myworkdayjobs.com/en-US/BlackBerry/jobs/details/Territory-Account-Manager_20231252", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -489,8 +489,8 @@ "id": "a4e1ac68-35bc-44a6-9e5f-53785df53bf2", "url": "https://careers.roblox.com/jobs/4979622", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -516,8 +516,8 @@ "id": "c0028644-9bfa-470e-9efd-d8473b42e313", "url": "https://www.northside.com/locations/atlanta-ophthalmology-associates", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + 
"category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -537,8 +537,8 @@ "id": "111ebd24-8617-48cb-b963-eb692bf1e53a", "url": "https://www.baptistfirst.org/location/baptist-health-ent-partners", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -558,8 +558,8 @@ "id": "270c2ebd-96c0-4bab-a24c-2c38a2df20aa", "url": "https://www.mymichigan.org/locations/profile/?id=2918&searchId=850eff7c-3b7f-ee11-a863-000d3a61151d&sort=11&page=4&pageSize=10", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -579,8 +579,8 @@ "id": "ed7b1cf6-5be4-40e7-ad00-89a67d1c8e40", "url": "https://www.uchealth.com/en/locations/montgomery-building", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -600,8 +600,8 @@ "id": "5df3d301-09f0-4ece-946d-c24952069ab7", "url": "https://uoflhealth.org/locations/gi-motility-clinic-gastroenterology/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -621,8 +621,8 @@ "id": "18b0b51e-196c-4765-bd70-aecff53f7e4d", "url": "https://www.garnethealth.org/locations", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. 
Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -684,8 +684,8 @@ "id": "db3fb266-a2cc-41bd-8995-1bdf2dd647fc", "url": "https://www.healthpartners.com/care/find/locations/?sort=name", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -720,8 +720,8 @@ "id": "dcad6730-1eb2-4df7-afb7-9b034afb2f04", "url": "https://www.heywood.org/locations", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -753,8 +753,8 @@ "id": "174b1151-ea9a-4745-bc88-8c56ffc23131", "url": "https://www.hhc.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -781,8 +781,8 @@ "id": "9aa944d7-257b-4451-9958-feddfb7bd250", "url": "https://www.huntregional.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. 
Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -806,8 +806,8 @@ "id": "18c29ec8-de1d-4015-aeb5-92129b9bba6c", "url": "https://iuhealth.org/find-locations/results?query=&page=1", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -834,8 +834,8 @@ "id": "a10f13b0-e4f1-490a-9fa1-64082d15e087", "url": "https://www.infirmaryhealth.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -947,8 +947,8 @@ "id": "97022d6c-f9d6-4481-85c8-2a9d9779e7b9", "url": "https://www.legacyhealth.org/doctors-and-locations.aspx?Latitude=&Longitude=&SearchType=LOCATIONS&keyword=&ActiveLocationTypeFilter=&services=&ZipCode=&Radius=5&PageNumber=1&PatientAge=&Specialties=&Gender=&Locations=&IsLHPMember=&OpenWeekends=undefined&Open24Hours=undefined", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. 
Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -988,8 +988,8 @@ "id": "41147504-625d-45d5-9689-92218fdd32b5", "url": "https://www.lifespan.org/locations", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1014,8 +1014,8 @@ "id": "c713976a-fd1d-4577-9956-c2a3ab295ead", "url": "https://www.lcmchealth.org/our-locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1232,8 +1232,8 @@ "id": "47b45f41-2b7e-4295-ac0c-93f02354cd93", "url": "https://www.hawaiipacifichealth.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "Fetch all of the links to the detail pages of clinics", "evals": [ @@ -1279,8 +1279,8 @@ "id": "97dc7166-7dcb-4c9f-941f-342996bf1ca8", "url": "https://www.mountsinai.org/locations", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "Fetch all of the links to the detail pages of clinics", "evals": [ @@ -1314,8 +1314,8 @@ "id": "29cc4cad-f85c-4d8f-952e-f41f7eb2bc73", "url": "https://www.acuityhealthcare.net/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "Fetch all of the links to the 
detail pages of clinics", "evals": [ @@ -1335,8 +1335,8 @@ "id": "bb50f4e4-7d66-4ba6-b613-1065ea58a6fc", "url": "https://www.adventisthealthcare.com/locations/results/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1361,8 +1361,8 @@ "id": "1e4d7ca6-5292-4857-aca6-bd0fff337435", "url": "https://apprhs.org/our-locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1404,8 +1404,8 @@ "id": "c45a5a21-964c-422c-96a9-acbfdebc64bc", "url": "https://www.archbold.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1468,8 +1468,8 @@ "id": "f9e89327-3556-492d-963d-3765eebdbb1d", "url": "https://www.arnothealth.org/hospitals", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. 
Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1487,8 +1487,8 @@ "id": "3724f66f-9743-499c-a4b5-7b7f32d9e2a4", "url": "https://www.astria.health/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1538,8 +1538,8 @@ "id": "3ee0e369-1cd7-41ac-940c-bee1afc1ef26", "url": "https://www.atlantichealth.org/locations/hospitals.html", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1561,8 +1561,8 @@ "id": "ce4dede3-9fee-44ea-99a6-0137a9aa2db8", "url": "https://www.swedish.org/locations?lookup=87af2959065c4704b21c5064dada6bfd&lookupvalue=Urgent%20Care&page=1&radius=&term=", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. 
Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1580,8 +1580,8 @@ "id": "998ed1f9-a3a8-4e85-9863-ccfa8d21d9a6", "url": "https://www.seielect.com/?stockcheck=ASR1JA330R", "source": "mhtml", - "domain": "manufacturing", - "subdomain": "commerce", + "category": "manufacturing", + "subcategory": "commerce", "type": "fetch", "fetch_id": "manufacturing_commerce", "evals": [ @@ -1597,8 +1597,8 @@ "id": "18f93ec4-086c-467c-a952-8565d8005742", "url": "https://www.kemet.com/en/us/capacitors/ceramic/product/CGP5C472MHWDAA7301.html", "source": "mhtml", - "domain": "manufacturing", - "subdomain": "commerce", + "category": "manufacturing", + "subcategory": "commerce", "type": "fetch", "fetch_id": "manufacturing_commerce", "evals": [ @@ -1614,8 +1614,8 @@ "id": "cd1ba388-8732-49e0-a5b1-09691aad999d", "url": "https://www.infineon.com/cms/en/product/power/mosfet/silicon-carbide/modules/df14mr12w1m1hf_b67/", "source": "mhtml", - "domain": "manufacturing", - "subdomain": "commerce", + "category": "manufacturing", + "subcategory": "commerce", "type": "fetch", "fetch_id": "manufacturing_commerce", "evals": [ @@ -1631,8 +1631,8 @@ "id": "6ad8593d-547d-4591-b4d5-a7cc42feeed4", "url": "https://www.nexperia.com/products/diodes/automotive-diodes/automotive-zener-diodes/BZX585-C6V8-Q.html", "source": "mhtml", - "domain": "manufacturing", - "subdomain": "commerce", + "category": "manufacturing", + "subcategory": "commerce", "type": "fetch", "fetch_id": "manufacturing_commerce", "evals": [ @@ -1648,8 +1648,8 @@ "id": "974d2768-776c-4157-8e6d-aea8bb22f832", "url": "https://www.capecodhealth.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. 
Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1674,8 +1674,8 @@ "id": "bdf05e0f-fe5f-4b0c-b750-a176d274d281", "url": "https://www.catholichealthservices.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1704,8 +1704,8 @@ "id": "8bf5db6d-3df6-464b-92b0-c0a04317feec", "url": "https://www.mycmh.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1755,8 +1755,8 @@ "id": "a2a07987-e9da-434d-9190-07a2e74c9600", "url": "https://dchsystem.com/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1782,8 +1782,8 @@ "id": "6d744ee4-bfb8-4061-badd-8ffa7e954e0f", "url": "https://ernesthealth.com/our-hospitals/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. 
Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1833,8 +1833,8 @@ "id": "fe899480-b3d1-4c28-a91f-a7c63b05c940", "url": "https://excelahealth.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1966,8 +1966,8 @@ "id": "62bca094-6cff-4cc5-8592-71d283babfa6", "url": "https://www.frhs.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -1992,8 +1992,8 @@ "id": "361cdcca-41ed-4afd-b9fb-d7f98289d4fb", "url": "https://www.flhealth.org/locations/location-search-results?SearchPattern=Contains&LocationDescendants=true", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -2018,8 +2018,8 @@ "id": "d5df56b5-f0bd-4d69-8cb5-11edfbf4568e", "url": "https://www.freemanhealth.com/all-locations", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. 
Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -2098,8 +2098,8 @@ "id": "a4593517-4ff7-40dd-b100-e24b90c72819", "url": "https://www.froedtert.com/locations", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -2135,8 +2135,8 @@ "id": "3692abd6-a2d1-4148-bd85-8993e9e2db81", "url": "https://www.capecodhealth.org/locations/profile/cape-cod-surgery-center/?searchId=b8a9e746-eb81-ee11-a867-000d3a611c21&sort=11&page=1&pageSize=10", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2156,8 +2156,8 @@ "id": "3b13610f-9bf2-44ad-b223-f5db5a6e259a", "url": "https://whiteriverhealth.org/doctors/facilities/38/orthopaedics-batesville", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2177,8 +2177,8 @@ "id": "4e974283-6ad8-4c6d-9788-0aff49ab0a57", "url": "https://www.wth.org/locations/west-tennessee-interventional-pain-dyersburg/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2198,8 +2198,8 @@ "id": "3c99030a-088b-42fc-bab6-84972afb65b5", "url": "https://www.selectspecialtyhospitals.com/locations-and-tours/wv/wheeling/wheeling/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2219,8 +2219,8 @@ "id": 
"afc8133f-a641-46fe-bf93-5b98d8e6cea3", "url": "https://whs.org/locations/childrens-therapy-center/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2240,8 +2240,8 @@ "id": "17d5678f-05ac-4bd4-b52b-79e6a710f8f1", "url": "https://www.wakemed.org/location/gastroenterology-north-raleigh", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2261,8 +2261,8 @@ "id": "180a3e5f-1cd7-4073-bf02-3dc663a6d41e", "url": "https://www.virtua.org/locations/surgicare-of-central-jersey", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2282,8 +2282,8 @@ "id": "5b3eb94e-3e5c-4c39-832c-48c25f38a8b8", "url": "https://locations.ecuhealth.org/Details/46?Index=3&_gl=1*8joxuy*_ga*MTYyMTMxNzA4Mi4xNjk5NjYzOTgz*_ga_4RQPPRT99M*MTY5OTY2Mzk4My4xLjAuMTY5OTY2Mzk4My4wLjAuMA..", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2303,8 +2303,8 @@ "id": "f6c00da0-3976-457b-982c-3efdea0ff7bb", "url": "https://veritascollaborative.com/locations/north-carolina/durham-nc-adult-eating-disorder-treatment-center/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2324,8 +2324,8 @@ "id": "583c1f78-16aa-4eee-ae29-4277f4495ea1", "url": "https://www.vcuhealth.org/locations/location-details?id=33", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", 
"evals": [ @@ -2345,8 +2345,8 @@ "id": "88ac8af0-d461-4c7f-8498-d7d53d65e3c0", "url": "https://search.vanderbilthealth.com/locations/vanderbilt-bill-wilkerson-center-franklin", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2366,8 +2366,8 @@ "id": "b81f0252-ecca-4dda-a7e1-dcdc48d0db2c", "url": "https://www.valleyhealthlink.com/our-locations/valley-health-page-memorial-hospital-multispecia/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2387,8 +2387,8 @@ "id": "c8ebee22-eeac-4479-9ca6-aebb1efc3a2f", "url": "https://www.uwmedicine.org/locations/northwest-hospital", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2408,8 +2408,8 @@ "id": "9d2df10f-4f04-4968-8227-c8a12f74b63d", "url": "https://www.uwhealth.org/locations/uw-health-specialty-clinic-sauk-prairie-270/optometry-clinic-1048", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2429,8 +2429,8 @@ "id": "ae5045c0-b6c2-40a3-9dab-bfafadb1f1ed", "url": "https://uvahealth.com/locations/UVA-Medical-Park-Zion-Crossroads-5597275", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2450,8 +2450,8 @@ "id": "f436cee3-06d1-472e-b98b-615905e41c52", "url": "https://www.usahealthsystem.com/locations/cardiac-catheterization-lab", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", 
"fetch_id": "contact", "evals": [ @@ -2471,8 +2471,8 @@ "id": "0fe1cf15-d5fb-416c-9e1b-f5cae188d088", "url": "https://uoflhealth.org/locations/uofl-health-hep-c-center/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2492,8 +2492,8 @@ "id": "4d167753-d180-497d-8510-02ab26f3a0f7", "url": "https://www.pennmedicine.org/for-patients-and-visitors/penn-medicine-locations/pennsylvania-hospital", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2513,8 +2513,8 @@ "id": "d401233f-2d50-426f-bf77-004411a19d6d", "url": "https://www.kansashealthsystem.com/locations/center-for-advanced-vascular-care-overland-park-ks", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2534,8 +2534,8 @@ "id": "e0ce7070-8cb3-416a-8090-7a6a186b4e8a", "url": "https://www.uchicagomedicine.org/comer/find-a-location/uchicago-medicine-comer-childrens-merrillville", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2555,8 +2555,8 @@ "id": "c95632a7-31a8-4177-9361-d07bdd809a7a", "url": "https://www.slhduluth.com/locations/st-lukes-interventional-pain-management/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2576,8 +2576,8 @@ "id": "a33c17c6-b2cd-433f-8972-09b969667866", "url": "https://www.arnothealth.org/st-josephs-hospital", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": 
"contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -2597,8 +2597,8 @@ "id": "cb25b8d2-1ac6-43d5-930f-70edeccf34f9", "url": "https://www.hackensackmeridianhealth.org/en/location-search#sort=%40locationname%20ascending&f:@locationtype=[Hospitals%20and%20Emergency%20Departments]", "source": "hosted", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "navigate", "goal": "You are currently on a listing page. Use pagination controls to travel to the last available listing page if possible ", "evals": [ @@ -2612,8 +2612,8 @@ "id": "2ac79ff2-a923-49df-9e66-5ce7f9d5d0e4", "url": "https://www.uchicagomedicine.org/find-a-location?page=5&sortby=default", "source": "hosted", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "navigate", "goal": "You are currently on a listing page. Use pagination controls to travel to the last available listing page if possible ", "evals": [ @@ -2627,8 +2627,8 @@ "id": "d76159ad-f62a-49e1-9896-df5ef91dcb5f", "url": "https://www.adventisthealthcare.com/locations/results/?searchId=7402b4ad-5a84-ee11-a85e-000d3a611ea2&sort=13&page=5", "source": "hosted", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "navigate", "goal": "You are currently on a listing page. Use pagination controls to travel to the last available listing page if possible ", "evals": [ @@ -2642,8 +2642,8 @@ "id": "17c411ab-5586-4cd7-940c-514959796b4f", "url": "https://www.providence.org/locations?lookup=25d90ac1a9024e7298afb10aff38bd76&lookupvalue=Hospitals&postal=V3Z&latlng=49.1049,-122.824&page=4", "source": "hosted", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "navigate", "goal": "You are currently on a listing page. 
Use pagination controls to travel to the last available listing page if possible ", "evals": [ @@ -2657,8 +2657,8 @@ "id": "6d85220a-b86e-4b85-96c8-0fb94447cf29", "url": "https://www.baptistfirst.org/find-a-location/?page=4&count=10", "source": "hosted", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "navigate", "goal": "You are currently on a listing page. Use pagination controls to travel to the last available listing page if possible ", "evals": [ @@ -2672,8 +2672,8 @@ "id": "6b9054b1-c67c-46cc-bd67-7dfd29a9ebf1", "url": "https://www.mhs.net/locations?listPage=2", "source": "hosted", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "navigate", "goal": "You are currently on a listing page. Use pagination controls to travel to the last available listing page if possible ", "evals": [ @@ -2687,8 +2687,8 @@ "id": "a316a94d-7ad6-4385-a2e0-4b47e1f1a661", "url": "https://whs.org/locations-practices/search-results/", "source": "hosted", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "navigate", "goal": "You are currently on a listing page. Use pagination controls to travel to the last available listing page if possible ", "evals": [ @@ -2702,8 +2702,8 @@ "id": "8fc4b97d-f823-4c31-b50f-ad42671fe2b1", "url": "https://www.shrinerschildrens.org/en/locations?listPage=1", "source": "hosted", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "navigate", "goal": "You are currently on a listing page. 
Use pagination controls to travel to the last available listing page if possible ", "evals": [ @@ -2717,8 +2717,8 @@ "id": "b572a5e4-717b-41ab-86e3-ec41cac368b3", "url": "https://www.sih.net/locations?page=1&perpage=25&q=&serv=&dist=&zip=&sort=Ascending&view=list", "source": "hosted", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "navigate", "goal": "You are currently on a listing page. Use pagination controls to travel to the last available listing page if possible ", "evals": [ @@ -2732,8 +2732,8 @@ "id": "b2a98bed-bce2-404a-9b6b-ff27d28a6c1f", "url": "https://www.mercyone.org/find-a-location/locations-results?LocationText=&page=54&count=9", "source": "hosted", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "navigate", "goal": "You are currently on a listing page. Use pagination controls to travel to the last available listing page if possible ", "evals": [ @@ -2747,8 +2747,8 @@ "id": "798be63a-06df-494e-a1b1-a021bec4882e", "url": "https://community.openai.com/t/how-to-address-a-gpt-in-its-instructions/513763", "source": "mhtml", - "domain": "software", - "subdomain": "forum", + "category": "software", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -2770,8 +2770,8 @@ "id": "6adb9aad-6d42-4366-a6a9-f5ae958889d7", "url": "https://twitter.com/asimdotshrestha/status/1728466080811909126", "source": "mhtml", - "domain": "software", - "subdomain": "forum", + "category": "software", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -2793,8 +2793,8 @@ "id": "75ce3f5e-1dd4-42bf-8620-44a6b5bc0f78", "url": "https://news.ycombinator.com/item?id=38434914", "source": "mhtml", - "domain": "software", - "subdomain": "forum", + "category": "software", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -2815,8 +2815,8 @@ "id": 
"1d7f793c-5c51-487a-86e7-dd68a478b16a", "url": "https://www.gamespot.com/forums/system-wars-314159282/so-robocop-game-is-not-bad-33610315/", "source": "mhtml", - "domain": "software", - "subdomain": "forum", + "category": "software", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -2837,8 +2837,8 @@ "id": "7bc386a7-0d5b-45dc-ab10-8189451379a6", "url": "https://stackoverflow.com/questions/77529741/custom-jscript-event-alway-returns-undefined-in-ga4-gtm-debug-any-ideas", "source": "mhtml", - "domain": "software", - "subdomain": "forum", + "category": "software", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -2860,8 +2860,8 @@ "id": "9e1761b8-e5bd-4e96-b47e-8ff11bfadbc0", "url": "https://www.tripadvisor.com/ShowTopic-g28926-i29-k14574554-6_Weeks_in_California_and_Vegas-California.html", "source": "mhtml", - "domain": "travel", - "subdomain": "forum", + "category": "travel", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -2883,8 +2883,8 @@ "id": "4a7dac8a-ff74-4e36-8edf-41ebaa30790d", "url": "https://www.warriorforum.com/social-media/1447913-p-g-takes-first-step-into-metaverse-beautysphere.html?utm_source=internal&utm_medium=discussion-list&utm_campaign=feed&utm_term=title", "source": "mhtml", - "domain": "software", - "subdomain": "forum", + "category": "software", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -2906,8 +2906,8 @@ "id": "01d6fabd-adaf-4a4e-9990-0db26ea206ed", "url": "https://forums.premed101.com/topic/53408-what-counts-as-full-courseload/", "source": "mhtml", - "domain": "education", - "subdomain": "forum", + "category": "education", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -2929,8 +2929,8 @@ "id": "17c261ff-3f04-4fcf-bccd-90df4d043e61", "url": "https://forums.redflagdeals.com/1366-vs-1150-a-1388015/", "source": "mhtml", - "domain": "e-commerce", - "subdomain": "forum", + "category": 
"e-commerce", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -2952,8 +2952,8 @@ "id": "d0164f97-f6a3-403f-acbb-a9784194ef17", "url": "https://www.f150forum.com/f69/9-28-17-build-date-395413/", "source": "mhtml", - "domain": "automotive", - "subdomain": "forum", + "category": "automotive", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -2975,8 +2975,8 @@ "id": "ad07bc26-794c-4264-8122-2aae31c383ef", "url": "https://patient.info/forums/discuss/tingling-in-my-hands-and-cheeks-with-a-sore-throat-and-red-dots-on-roof-of-mouth-and-sores-on-cheeks-739597", "source": "mhtml", - "domain": "healthcare", - "subdomain": "forum", + "category": "healthcare", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -2998,8 +2998,8 @@ "id": "47a75c05-fc65-4a7c-b98c-d9438a5f8988", "url": "https://www.teamblind.com/post/Stop-f-around-start-your-own-company-hkcNxAgX", "source": "mhtml", - "domain": "software", - "subdomain": "forum", + "category": "software", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -3021,8 +3021,8 @@ "id": "03a77421-5216-4862-bc1d-02a8012d36cd", "url": "https://community.adobe.com/t5/photoshop-elements-discussions/restore-catalog-from-sd-cards/m-p/13612011#M88645", "source": "mhtml", - "domain": "software", - "subdomain": "forum", + "category": "software", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -3044,8 +3044,8 @@ "id": "854eb702-93f1-42c2-8d07-16d7b776cc38", "url": "https://community.startupnation.com/discussion/14445/what-is-the-best-way-to-get-funding-for-your-start-up-or-idea", "source": "mhtml", - "domain": "software", - "subdomain": "forum", + "category": "software", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -3067,8 +3067,8 @@ "id": "a72534ac-79ea-4e94-9a76-2928ae2342b8", "url": 
"https://www.indiehackers.com/post/generating-200k-monthly-revenue-with-an-online-photo-editor-ad36e6538e", "source": "mhtml", - "domain": "software", - "subdomain": "forum", + "category": "software", + "subcategory": "forum", "type": "fetch", "fetch_id": "forum", "evals": [ @@ -3090,8 +3090,8 @@ "id": "1534f6a2-81ed-48ff-b118-a4d752dae524", "url": "https://openai.com/careers/ai-policy-counsel", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -3117,8 +3117,8 @@ "id": "fb3e1776-3a8a-41da-b077-bff601723a70", "url": "https://openai.com/careers/data-infrastructure-engineer", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -3144,8 +3144,8 @@ "id": "7614e6a7-7d69-4f59-879a-4288ca319bee", "url": "https://openai.com/careers/engineering-manager-fine-tuning-api", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -3171,8 +3171,8 @@ "id": "0f8d967e-07a9-450a-b6b9-c60ad4c07ec7", "url": "https://openai.com/careers/head-of-commercial-legal", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -3198,8 +3198,8 @@ "id": "ab4689a7-cf62-473d-bfa0-5d8aa1b78d87", "url": "https://www.accenture.com/us-en/careers/jobdetails?id=11789141_en&title=Director%20of%20Medicare%20Claims", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -3225,8 +3225,8 @@ "id": "d2bffe5e-ccda-4ec7-bbab-4827da462bf9", "url": 
"https://www.accenture.com/us-en/careers/jobdetails?id=R00186436_en&title=MES%20PharmaSuite%20Engineer", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -3252,8 +3252,8 @@ "id": "75d8750c-7042-4079-b782-1448475d724e", "url": "https://www.accenture.com/us-en/careers/jobdetails?id=11770326_en&title=Payroll%20Operations%20Manager", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ @@ -3279,8 +3279,8 @@ "id": "e99a7fb9-360e-4949-9d04-73b655502d3d", "url": "https://www.accenture.com/us-en/careers/jobdetails?id=R00185110_en&title=T%26D%20Grid%20Operations%20Consultant", "source": "mhtml", - "domain": "software", - "subdomain": "careers", + "category": "software", + "subcategory": "careers", "type": "fetch", "fetch_id": "job_posting", "evals": [ diff --git a/static/test_examples.json b/static/test_examples.json index 223016d4..57ac31f8 100644 --- a/static/test_examples.json +++ b/static/test_examples.json @@ -3,8 +3,8 @@ "id": "83e3aff0-8447-4c67-9d4c-18ce8954585a", "url": "https://www.mmchs.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -44,8 +44,8 @@ "id": "db2c9d7a-7c76-441a-a21b-c2bfe200407d", "url": "https://www.mhsystem.org/ourlocations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. 
Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -73,8 +73,8 @@ "id": "65e9b04a-7833-43f3-877d-ae27a02eed70", "url": "https://www.mhs.net/locations?listPage=1", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -99,8 +99,8 @@ "id": "c6bee4be-3394-4867-b5a8-52d6e9901e62", "url": "https://www.memorialcare.org/locations", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -315,8 +315,8 @@ "id": "135502cc-bdaf-4f36-a2d5-4023a331aa6a", "url": "https://www.mercy.net/search/location/?q=&locationType=&locationOfferings=&servicesOffered=&solrsort=&distance=25&page=1", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -341,8 +341,8 @@ "id": "36601c8a-255c-4f64-b723-3694d1c9dcc1", "url": "https://www.methodisthealth.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. 
Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -372,8 +372,8 @@ "id": "073862e2-e519-42cb-8cb0-d9e419a33a1b", "url": "https://www.mymichigan.org/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -398,8 +398,8 @@ "id": "953ff6ad-d115-499f-9e51-bed7b638ad41", "url": "https://www.duncanregional.com/locations/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -421,8 +421,8 @@ "id": "5cc195cf-ac77-46ef-a9ac-f96887c8a50f", "url": "https://www.dukehealth.org/locations?sc=30&view=list", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "links", "goal": "You are viewing a listing page of a website that aggregates information about clinics. 
Your goal is to scrape all of the links to the detail pages of clinics on the current page", "evals": [ @@ -467,8 +467,8 @@ "id": "e6067e2c-efd3-4ae4-a766-a1a846c678ad", "url": "https://www.universityhealthkc.org/locations/university-health-oral-maxillofacial-surgery-clinic/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -488,8 +488,8 @@ "id": "ede570fd-c859-47bc-8432-7d0e7a25139e", "url": "https://www.unitypoint.org/locations/allen-womens-health", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -509,8 +509,8 @@ "id": "238f430b-824a-46e9-8f2e-5fa08176a0e0", "url": "https://www.nyuhs.org/location-search/adult-community-free-clinic-uhs-primary-care-binghamton", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -530,8 +530,8 @@ "id": "d0f2dd50-db96-475a-ae1f-57acba811fae", "url": "https://uniongeneralhealthsystem.com/facility/hayesville-family-practice/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -551,8 +551,8 @@ "id": "ef217309-7c87-45f9-931c-fc662d55646a", "url": "https://www.uabmedicine.org/locations/gardendale-primary-care/", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -572,8 +572,8 @@ "id": "6088d589-a01d-4360-a3e5-c22e7a9baed4", "url": "https://towerhealth.org/locations/st-christophers-pediatric-associates-registered-dieticians", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", 
+ "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -593,8 +593,8 @@ "id": "0de6f7ca-3eba-45d9-990d-3255955c38e6", "url": "https://www.tidelandshealth.org/locations/profile/myrtlebeachfamilymed/?searchId=bf5cebce-5983-ee11-a860-000d3a611816&sort=11&page=5&pageSize=10", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -614,8 +614,8 @@ "id": "4cd7de7b-5cf9-48aa-b1c9-be1858eb0a26", "url": "https://www.sutterhealth.org/find-location/facility/brentwood-center-lab", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -635,8 +635,8 @@ "id": "bc7d1f13-811d-42a5-a3f7-49175675a54e", "url": "https://findalocation.slhn.org/practice/details/11251?theme=dir_sluhn", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ @@ -656,8 +656,8 @@ "id": "ca386162-ee75-485e-8f9d-13d488fc477a", "url": "https://www.stlukesonline.org/communities-and-locations/facilities/clinics/st-lukes-clinic-lifestyle-medicine-twin-falls-addison-ave", "source": "mhtml", - "domain": "healthcare", - "subdomain": "contact", + "category": "healthcare", + "subcategory": "contact", "type": "fetch", "fetch_id": "contact", "evals": [ diff --git a/tests/test_example_eval.py b/tests/test_example_eval.py index 681e70b2..20e9e5e9 100644 --- a/tests/test_example_eval.py +++ b/tests/test_example_eval.py @@ -111,8 +111,8 @@ def create_default_example( "id": "1", "url": "url", "source": "mhtml", - "domain": "domain", - "subdomain": "subdomain", + "category": "category", + "subcategory": "subcategory", "type": "fetch", "evals": [], "fetch_id": None, # Set as None by default diff --git 
a/tests/test_generator.py b/tests/test_generator.py index 3140725a..f9d6a6b8 100644 --- a/tests/test_generator.py +++ b/tests/test_generator.py @@ -9,8 +9,8 @@ def test_generate_test_with_single_eval() -> None: id="1", url="https://www.test.com", source="mhtml", - domain="test", - subdomain="www", + category="test", + subcategory="www", type="fetch", evals=[Eval(type="json_match", expected={"key": "value"})], fetch_id="job_posting", @@ -26,8 +26,8 @@ def test_generate_test_with_multiple_evals() -> None: id="1", url="https://www.test.com", source="mhtml", - domain="test", - subdomain="www", + category="test", + subcategory="www", type="fetch", evals=[ Eval(type="json_match", expected={"key": "value"}), @@ -47,8 +47,8 @@ def test_generate_class_name_without_www() -> None: id="1", url="https://test.com", source="mhtml", - domain="test", - subdomain="www", + category="test", + subcategory="www", type="fetch", evals=[], fetch_id="job_posting", @@ -64,8 +64,8 @@ def test_generate_class_name_with_www() -> None: id="1", url="https://www.test.com", source="mhtml", - domain="test", - subdomain="www", + category="test", + subcategory="www", type="fetch", evals=[], fetch_id="job_posting", @@ -75,14 +75,14 @@ def test_generate_class_name_with_www() -> None: assert class_name == "TestFetchTestCom" -def test_generate_class_name_with_multiple_domains() -> None: +def test_generate_class_name_with_multiple_categories() -> None: generator = PytestTestGenerator() example1 = Example( id="1", url="https://test.com", source="mhtml", - domain="test", - subdomain="www", + category="test", + subcategory="www", type="fetch", evals=[], fetch_id="job_posting", @@ -92,8 +92,8 @@ def test_generate_class_name_with_multiple_domains() -> None: id="2", url="https://test.com", source="mhtml", - domain="test", - subdomain="www", + category="test", + subcategory="www", type="fetch", evals=[], fetch_id="job_posting", diff --git a/tests/test_runner.py b/tests/test_runner.py index 6cc117bf..1e58b02f 100644
--- a/tests/test_runner.py +++ b/tests/test_runner.py @@ -28,9 +28,9 @@ def example(): return Example( id="test", url="https://example.com", - subdomain="test", + subcategory="test", type="links", - domain="test", + category="test", goal="links", source="hosted", evals=[],