{"id":25368,"uuid":"517726737","full_name":"aphp/edspdf","owner":"aphp","description":"EDS-PDF is a generic, pure-Python framework for text extraction from PDF documents. It provides the machinery to use rule- or machine-learning-based approaches to classify text blocs between body and meta-data.","archived":false,"fork":false,"pushed_at":"2025-02-12T14:12:06.000Z","size":9359,"stargazers_count":63,"open_issues_count":0,"forks_count":7,"subscribers_count":3,"default_branch":"main","last_synced_at":"2026-03-29T07:23:10.805Z","etag":null,"topics":["extraction","machine-learning","pdf"],"latest_commit_sha":null,"homepage":"https://aphp.github.io/edspdf/","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"bsd-3-clause","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/aphp.png","metadata":{"files":{"readme":"README.md","changelog":"changelog.md","contributing":"contributing.md","funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":"CITATION.cff","codeowners":null,"security":null,"support":null,"governance":null,"roadmap":"docs/roadmap.md","authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null}},"created_at":"2022-07-25T15:47:09.000Z","updated_at":"2026-03-25T01:02:14.000Z","dependencies_parsed_at":"2025-03-31T20:18:04.275Z","dependency_job_id":null,"html_url":"https://github.com/aphp/edspdf","commit_stats":{"total_commits":293,"total_committers":10,"mean_commits":29.3,"dds":0.621160409556314,"last_synced_commit":"5778c0e1ec01c9a0835832938cc3b49b5d051ffc"},"previous_names":["aphp/edspdf"],"tags_count":12,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosystem.code.gouv.fr/api/v1/hosts/GitHub/repositories/aphp%2Fedspdf","tags_url":"https://repos.ecosystem.code.gouv.fr/api/v1/hosts/GitHub/repositories/aphp%2Fedspdf/tags","releases_url":"https://repos.ecosystem.code.gouv.fr/api/v1/hosts/GitHub/repositories/aphp%2Fedspdf/releases","manifests_url":"https://repos.ecosystem.code.gouv.fr/api/v1/hosts/GitHub/repositories/aphp%2Fedspdf/manifests","owner_url":"https://repos.ecosystem.code.gouv.fr/api/v1/hosts/GitHub/owners/aphp","download_url":"https://codeload.github.com/aphp/edspdf/tar.gz/refs/heads/main","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":10470,"owners_count":245,"icon_url":"https://github.com/github.png","version":null,"created_at":"2024-05-17T14:54:58.822Z","updated_at":"2025-01-13T09:52:00.106Z","host_url":"https://repos.ecosystem.code.gouv.fr/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosystem.code.gouv.fr/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosystem.code.gouv.fr/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosystem.code.gouv.fr/api/v1/hosts/GitHub/owners"}}