{"payload":{"header_redesign_enabled":false,"results":[{"id":"541798154","archived":false,"color":"#e34c26","followers":6853,"has_funding_file":false,"hl_name":"Unstructured-IO/unstructured","hl_trunc_description":"Open source libraries and APIs to build custom preprocessing pipelines for labeling, training, or production machine learning pipelines. ","language":"HTML","mirror":false,"owned_by_organization":true,"public":true,"repo":{"repository":{"id":541798154,"name":"unstructured","owner_id":108372208,"owner_login":"Unstructured-IO","updated_at":"2024-05-22T00:26:55.910Z","has_issues":true}},"sponsorable":false,"topics":["nlp","pdf","machine-learning","natural-language-processing","information-retrieval","ocr","deep-learning","ml","docx","preprocessing","pdf-to-text","data-pipelines","donut","document-image-processing","document-parser","pdf-to-json","document-image-analysis","llm","document-parsing","langchain"],"type":"Public","help_wanted_issues_count":0,"good_first_issue_issues_count":4,"starred_by_current_user":false}],"type":"repositories","page":1,"page_count":1,"elapsed_millis":63,"errors":[],"result_count":1,"facets":[],"protected_org_logins":[],"topics":null,"query_id":"","logged_in":false,"sign_up_path":"/signup?source=code_search_results","sign_in_path":"/login?return_to=https%3A%2F%2Fgithub.com%2Fsearch%3Fq%3Drepo%253AUnstructured-IO%252Funstructured%2B%2Blanguage%253AHTML","metadata":null,"csrf_tokens":{"/Unstructured-IO/unstructured/star":{"post":"T1ZH0HYac_MxSWbnbQj12aGV-NciEHgQ_mQRFBsS3-rINtQ-YY1WchSgXLjPI_hI9nvCd4CH0f9IwJyN6CcSKQ"},"/Unstructured-IO/unstructured/unstar":{"post":"Saw_pVC-UgTY0cljPDNhGQMBSwdz4Y0F5X18_d1aBx-h1ytZZkX-HfRiw0t7eYPayFY4Sb4TxY_-SYsJ2ziKwA"},"/sponsors/batch_deferred_sponsor_buttons":{"post":"uWTVSc7JYQY6m_rJ5SZ0TjZojXKG9SoOgP-B3f-6XV0Fq2aNAs1unJXFEIqRbet2Zb4qrHES5AzDtiEWngmhWA"}}},"title":"Repository search results"}