{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"unstructured-inference","owner":"Unstructured-IO","isFork":false,"description":"","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":15,"issueCount":13,"starsCount":117,"forksCount":32,"license":"Apache License 2.0","participation":[1,1,3,0,3,4,8,3,3,4,2,4,5,3,4,4,3,10,4,3,10,8,2,5,1,6,1,2,2,1,4,0,0,1,1,0,0,1,1,0,0,1,2,2,0,2,0,2,1,2,3,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T06:31:08.683Z"}},{"type":"Public","name":"unstructured","owner":"Unstructured-IO","isFork":false,"description":"Open source libraries and APIs to build custom preprocessing pipelines for labeling, training, or production machine learning pipelines. ","topicNames":["nlp","pdf","machine-learning","natural-language-processing","information-retrieval","deep-learning","ml","docx","preprocessing","pdf-to-text"],"topicsNotShown":10,"allTopics":["nlp","pdf","machine-learning","natural-language-processing","information-retrieval","deep-learning","ml","docx","preprocessing","pdf-to-text","data-pipelines","donut","document-image-processing","document-parser","pdf-to-json","document-image-analysis","llm","document-parsing","langchain","ocr"],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":27,"issueCount":190,"starsCount":6840,"forksCount":519,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T06:27:37.491Z"}},{"type":"Public","name":"unstructured-js-client","owner":"Unstructured-IO","isFork":false,"description":"A Typescript client for the Unstructured hosted API","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"TypeScript","color":"#3178c6"},"pullRequestCount":3,"issueCount":6,"starsCount":23,"forksCount":5,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,27,21,3,2,6,6,2,7,2,0,1,1,2,0,0,5,0,0,2,0,0,7,3,1,0,5,2,0,5,1,0,0,2,4,2],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T00:23:05.317Z"}},{"type":"Public","name":"docs","owner":"Unstructured-IO","isFork":false,"description":"Documentation for all Unstructured products and libraries","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"MDX","color":"#fcb32c"},"pullRequestCount":3,"issueCount":1,"starsCount":1,"forksCount":2,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,11,6,10,4,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-20T19:48:52.924Z"}},{"type":"Public","name":"unstructured-python-client","owner":"Unstructured-IO","isFork":false,"description":"A Python client for the Unstructured hosted API","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":3,"starsCount":46,"forksCount":6,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,11,33,45,18,0,7,5,6,4,6,7,4,1,4,4,8,0,6,4,7,6,10,21,6,1,4,4,1,1,2,4,0,0,1,5,6,2],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-20T12:39:24.814Z"}},{"type":"Public","name":"unstructured-api","owner":"Unstructured-IO","isFork":false,"description":"","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":25,"starsCount":384,"forksCount":78,"license":"Apache License 2.0","participation":[2,5,3,4,6,7,3,4,6,2,6,1,4,10,2,16,8,8,9,6,7,5,4,4,3,4,0,1,6,0,2,0,1,2,7,6,0,3,1,3,4,2,2,6,0,2,2,0,0,3,6,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-12T18:51:44.828Z"}},{"type":"Public","name":"base-images","owner":"Unstructured-IO","isFork":false,"description":"Store Dockerfiles and Packer configs for images to use as a base to build upon","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Shell","color":"#89e051"},"pullRequestCount":1,"issueCount":1,"starsCount":0,"forksCount":0,"license":"Apache License 2.0","participation":[0,10,0,2,0,29,9,0,2,0,0,0,0,1,8,1,0,0,1,0,0,0,1,2,6,0,0,2,0,0,0,0,0,0,2,0,0,2,0,1,0,0,0,1,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-09T17:37:40.942Z"}},{"type":"Public","name":".github","owner":"Unstructured-IO","isFork":false,"description":"","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":null,"pullRequestCount":1,"issueCount":1,"starsCount":0,"forksCount":2,"license":null,"participation":[0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-13T17:03:55.269Z"}},{"type":"Public","name":"pipeline-sec-filings","owner":"Unstructured-IO","isFork":false,"description":"Preprocessing pipeline notebooks and API supporting text extraction from SEC documents","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":7,"issueCount":5,"starsCount":133,"forksCount":25,"license":"Apache License 2.0","participation":[0,2,0,0,1,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-01T14:22:11.008Z"}},{"type":"Public","name":"pipeline-template","owner":"Unstructured-IO","isFork":false,"description":"","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":4,"issueCount":0,"starsCount":8,"forksCount":6,"license":"Apache License 2.0","participation":[0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-02T07:43:40.959Z"}},{"type":"Public","name":"pipeline-oer","owner":"Unstructured-IO","isFork":false,"description":"Pipeline for extraction information from Army OERs","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":6,"issueCount":1,"starsCount":7,"forksCount":4,"license":"Apache License 2.0","participation":[0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-01T18:30:30.826Z"}},{"type":"Public","name":"unstructured.PaddleOCR","owner":"Unstructured-IO","isFork":true,"description":"Awesome multilingual OCR toolkits based on PaddlePaddle (practical ultra lightweight OCR system, support 80+ languages recognition, provide data annotation and synthesis tools, support training and deployment among server, mobile, embedded and IoT devices)","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":17,"forksCount":7323,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,9,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-11T22:17:50.110Z"}},{"type":"Public","name":"unstructured.pytesseract","owner":"Unstructured-IO","isFork":true,"description":"A Python wrapper for Google Tesseract","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":699,"license":"Apache License 2.0","participation":[0,0,0,2,1,1,0,2,2,0,2,0,0,13,4,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-05T17:53:08.478Z"}},{"type":"Public","name":"pipeline-paddleocr","owner":"Unstructured-IO","isFork":false,"description":"Pipeline for converting PDFs to raw text with PaddleOCR","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":5,"issueCount":1,"starsCount":14,"forksCount":5,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-21T01:45:59.434Z"}},{"type":"Public","name":"langchain","owner":"Unstructured-IO","isFork":true,"description":"⚡ Building applications with LLMs through composability ⚡","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":9,"forksCount":13206,"license":"MIT License","participation":[116,128,106,120,145,115,178,128,158,159,149,159,93,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-18T19:36:45.228Z"}},{"type":"Public archive","name":"unstructured-api-tools","owner":"Unstructured-IO","isFork":false,"description":"","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":2,"starsCount":28,"forksCount":9,"license":"Apache License 2.0","participation":[1,0,1,0,3,1,0,1,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-04T19:18:28.251Z"}},{"type":"Public","name":"terraform-aws-ecs-web-app","owner":"Unstructured-IO","isFork":true,"description":"Terraform module that implements a web app on ECS and supports autoscaling, CI/CD, monitoring, ALB integration, and much more.","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"HCL","color":"#844FBA"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":152,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-07-06T20:22:27.559Z"}},{"type":"Public","name":"terraform-aws-ecs-alb-service-task","owner":"Unstructured-IO","isFork":true,"description":"Terraform module which implements an ECS service which exposes a web service via ALB.","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"HCL","color":"#844FBA"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":190,"license":"Apache License 2.0","participation":[0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-07-06T20:20:08.031Z"}},{"type":"Public","name":"pipeline-document-layout","owner":"Unstructured-IO","isFork":false,"description":"Pipeline for layout extraction ","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":1,"starsCount":1,"forksCount":0,"license":"Apache License 2.0","participation":[0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-07-03T05:42:04.647Z"}},{"type":"Public","name":"pipeline-invoices","owner":"Unstructured-IO","isFork":false,"description":"","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":5,"issueCount":0,"starsCount":4,"forksCount":1,"license":"Apache License 2.0","participation":[0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-07-01T18:51:20.903Z"}},{"type":"Public","name":"pipeline-receipts","owner":"Unstructured-IO","isFork":false,"description":"Preprocessing pipeline notebooks and API supporting text extraction from receipts images","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":6,"issueCount":0,"starsCount":1,"forksCount":1,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-06-20T22:07:10.214Z"}},{"type":"Public","name":"unstructured.Paddle","owner":"Unstructured-IO","isFork":true,"description":"PArallel Distributed Deep LEarning: Machine Learning Framework from Industrial Practice (『飞桨』核心框架,深度学习&机器学习高性能单机、分布式训练和跨平台部署)","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":5443,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-06-09T22:41:36.384Z"}},{"type":"Public","name":"irs-manual-demo","owner":"Unstructured-IO","isFork":false,"description":"","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":14,"forksCount":7,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-06-09T19:17:25.422Z"}},{"type":"Public","name":"langchainjs","owner":"Unstructured-IO","isFork":true,"description":"","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"TypeScript","color":"#3178c6"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":1865,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-06-01T17:23:29.147Z"}},{"type":"Public archive","name":"community","owner":"Unstructured-IO","isFork":false,"description":"Open source libraries and APIs to build custom preprocessing pipelines for labeling, training, or production machine learning pipelines.","topicNames":["open-source","community","machine-learning","deep-learning","nlp-parsing","data-pipeline","ocr-python","document-ai","preprocessing-data","document-parsing"],"topicsNotShown":0,"allTopics":["open-source","community","machine-learning","deep-learning","nlp-parsing","data-pipeline","ocr-python","document-ai","preprocessing-data","document-parsing"],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":19,"forksCount":6,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-04-07T18:57:00.441Z"}},{"type":"Public","name":"prometheus-community-helm-charts","owner":"Unstructured-IO","isFork":true,"description":"Prometheus community Helm charts","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Mustache","color":"#724b3b"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":4891,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-03-04T06:23:40.748Z"}},{"type":"Public","name":"chat-isw-reports","owner":"Unstructured-IO","isFork":true,"description":"","topicNames":[],"topicsNotShown":0,"allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":5,"forksCount":266,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-02-14T20:30:06.249Z"}}],"repositoryCount":27,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}