{"id":3982053,"name":"github.com/datatogether/extract_href","ecosystem":"go","description":"extract_href is a command line tool for extracting urls from a HTML web page.\nwriting each url on a new line.\nEach matched url is:\n\nit uses a jquery-style selector to search the HTML document for elements that have an href attribute\nto construct a de-duplicated list of href attributes\nIt has three major command line options:\n\nexample use:\n```\n\n```\nthis will fetch the epa.gov url, select all \"a\" tags in the document that are a decendant of any element with the classes \"main-column\" and \"clearfix\"\nand build a deduplicated list of absolute urls using the `href` attribute of all found anchor tags. run that same command adding `-o urls.txt` to save\nthe results to a file and see output stats instead.\nPicking the right jquery selector is a bit of an art, the goal is to isolate the most general part of the page that contains all of the links\nthat you're after. For more information on jquery selectors and how they work, have a look here: https://learn.jquery.com/using-jquery-core/selecting-elements/\nWhen in doubt, it's often fine to leave the default \"a\" selector, which will generate lots of links you may not want,\nand manually remove them from the output file.","homepage":"https://github.com/datatogether/extract_href","licenses":"AGPL-3.0","normalized_licenses":["AGPL-3.0"],"repository_url":"https://github.com/datatogether/extract_href","keywords_array":[],"namespace":"github.com/datatogether","versions_count":1,"first_release_published_at":"2017-10-27T13:26:48.000Z","latest_release_published_at":"2017-10-27T13:26:48.000Z","latest_release_number":"v0.0.0-20171027132648-8967acede352","last_synced_at":"2026-03-24T00:01:34.891Z","created_at":"2022-04-12T07:53:44.162Z","updated_at":"2026-03-24T00:01:34.891Z","registry_url":"https://pkg.go.dev/github.com/datatogether/extract_href","install_command":"go get github.com/datatogether/extract_href","documentation_url":"https://pkg.go.dev/github.com/datatogether/extract_href#section-documentation","metadata":{},"repo_metadata":{"uuid":"103188784","full_name":"datatogether/extract_href","owner":"datatogether","description":"Command line tool for extracting urls from a HTML web page using a jquery-style selector","archived":true,"fork":false,"pushed_at":"2017-11-04T04:15:35.000Z","size":110,"stargazers_count":4,"open_issues_count":2,"forks_count":0,"subscribers_count":7,"default_branch":"master","last_synced_at":"2023-03-01T20:15:35.311Z","etag":null,"topics":["cli","golang","html","links"],"latest_commit_sha":null,"homepage":"","language":"Go","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"agpl-3.0","status":null,"scm":"git","pull_requests_enabled":true,"logo_url":null,"metadata":{"files":{"readme":"README.md","changelog":null,"contributing":".github/CONTRIBUTING.md","funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null}},"created_at":"2017-09-11T21:13:49.000Z","updated_at":"2023-01-28T16:43:23.000Z","dependencies_parsed_at":"2022-09-12T15:30:27.027Z","dependency_job_id":null,"html_url":"https://github.com/datatogether/extract_href","commit_stats":null,"repository_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/datatogether%2Fextract_href","tags_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/datatogether%2Fextract_href/tags","manifests_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/datatogether%2Fextract_href/manifests","owner_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/datatogether","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":108921946,"host_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names"}},"repo_metadata_updated_at":"2023-03-21T19:20:16.339Z","dependent_packages_count":0,"downloads":null,"downloads_period":null,"dependent_repos_count":0,"rankings":{"downloads":null,"dependent_repos_count":9.345852080216646,"dependent_packages_count":6.999148183520997,"stargazers_count":null,"forks_count":null,"average":8.172500131868823},"purl":"pkg:golang/github.com/datatogether/extract_href","advisories":[],"docker_usage_url":"https://docker.ecosyste.ms/usage/go/github.com/datatogether/extract_href","docker_dependents_count":null,"docker_downloads_count":null,"usage_url":"https://repos.ecosyste.ms/usage/go/github.com/datatogether/extract_href","dependent_repositories_url":"https://repos.ecosyste.ms/api/v1/usage/go/github.com/datatogether/extract_href/dependencies","status":null,"funding_links":[],"critical":null,"issue_metadata":{"last_synced_at":"2023-05-18T16:51:39.496Z","issues_count":2,"pull_requests_count":2,"avg_time_to_close_issue":129359.0,"avg_time_to_close_pull_request":463.0,"issues_closed_count":1,"pull_requests_closed_count":1,"pull_request_authors_count":1,"issue_authors_count":2,"avg_comments_per_issue":0.0,"avg_comments_per_pull_request":0.0,"merged_pull_requests_count":1,"bot_issues_count":0,"bot_pull_requests_count":0,"past_year_issues_count":0,"past_year_pull_requests_count":0,"past_year_avg_time_to_close_issue":null,"past_year_avg_time_to_close_pull_request":null,"past_year_issues_closed_count":0,"past_year_pull_requests_closed_count":0,"past_year_pull_request_authors_count":0,"past_year_issue_authors_count":0,"past_year_avg_comments_per_issue":null,"past_year_avg_comments_per_pull_request":null,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":0,"past_year_merged_pull_requests_count":0},"versions_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/packages/github.com%2Fdatatogether%2Fextract_href/versions","version_numbers_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/packages/github.com%2Fdatatogether%2Fextract_href/version_numbers","dependent_packages_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/packages/github.com%2Fdatatogether%2Fextract_href/dependent_packages","related_packages_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/packages/github.com%2Fdatatogether%2Fextract_href/related_packages","codemeta_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/packages/github.com%2Fdatatogether%2Fextract_href/codemeta","maintainers":[]}