{"payload":{"pageCount":7,"repositories":[{"type":"Public","name":"Formasaurus","owner":"scrapinghub","isFork":true,"description":"Formasaurus tells you the type of an HTML form and its fields using machine learning","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":1,"issueCount":0,"starsCount":5,"forksCount":47,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,10,9,1,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-16T16:25:31.355Z"}},{"type":"Public","name":"web-poet","owner":"scrapinghub","isFork":false,"description":"Web scraping Page Objects core library","allTopics":["python","web-scraping","hacktoberfest","page-objects"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":13,"issueCount":14,"starsCount":93,"forksCount":14,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":[0,10,7,0,0,0,0,12,0,0,0,0,0,0,0,0,0,5,0,0,0,4,3,3,0,4,15,0,2,2,0,7,10,1,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,1],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-16T07:48:36.852Z"}},{"type":"Public","name":"shub-workflow","owner":"scrapinghub","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":2,"starsCount":13,"forksCount":13,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":[4,8,0,0,8,0,1,12,0,1,4,0,13,0,0,0,0,0,0,2,2,0,4,0,0,0,0,0,0,0,4,0,0,5,0,0,0,0,0,4,2,2,0,0,0,2,4,1,0,7,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-15T19:15:17.999Z"}},{"type":"Public","name":"spidermon","owner":"scrapinghub","isFork":false,"description":"Scrapy Extension for monitoring spiders execution.","allTopics":["testing","monitoring","scraping","crawling","spiders","hacktoberfest","monitoring-tool","scrapinghub"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":5,"issueCount":38,"starsCount":524,"forksCount":94,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":[2,0,0,4,0,0,9,1,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,4,0,0,0,0,1,1,1,5,1,1,0,1,0,0,0,0,0,3],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-15T14:08:48.393Z"}},{"type":"Public","name":"scrapy-poet","owner":"scrapinghub","isFork":false,"description":"Page Object pattern for Scrapy","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":6,"issueCount":9,"starsCount":117,"forksCount":28,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":[0,1,0,0,0,1,0,24,17,9,0,0,5,0,2,13,7,10,2,1,18,10,14,0,0,5,1,6,4,4,0,1,10,6,0,0,0,0,0,0,6,0,0,0,0,0,3,0,0,4,2,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-12T14:20:40.409Z"}},{"type":"Public","name":"shublang","owner":"scrapinghub","isFork":false,"description":"Pluggable DSL that uses pipes to perform a series of linear transformations to extract data","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":6,"issueCount":23,"starsCount":15,"forksCount":8,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-09T17:32:21.207Z"}},{"type":"Public","name":"pgcontents","owner":"scrapinghub","isFork":true,"description":"A Postgres-backed ContentsManager implementation for IPython","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":2,"forksCount":82,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-09T16:04:04.295Z"}},{"type":"Public","name":"scrapinghub-entrypoint-scrapy","owner":"scrapinghub","isFork":false,"description":"Scrapy entrypoint for Scrapinghub job runner","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":9,"starsCount":25,"forksCount":16,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-08T13:48:26.829Z"}},{"type":"Public","name":"woodpecker","owner":"scrapinghub","isFork":true,"description":"An opinionated fork of the Drone CI system","allTopics":[],"primaryLanguage":{"name":"Go","color":"#00ADD8"},"pullRequestCount":5,"issueCount":0,"starsCount":0,"forksCount":347,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-07T05:54:57.146Z"}},{"type":"Public","name":"scrapinghub-stack-scrapy","owner":"scrapinghub","isFork":false,"description":"Software stack with latest Scrapy and updated deps","allTopics":[],"primaryLanguage":{"name":"Dockerfile","color":"#384d54"},"pullRequestCount":2,"issueCount":1,"starsCount":61,"forksCount":21,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-06T02:04:49.833Z"}},{"type":"Public","name":"varanus","owner":"scrapinghub","isFork":false,"description":"A command line spider monitoring tool","allTopics":["spider","monitoring","python36"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":2,"starsCount":7,"forksCount":6,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-06T01:26:15.753Z"}},{"type":"Public","name":"scrapyrt","owner":"scrapinghub","isFork":false,"description":"HTTP API for Scrapy spiders ","allTopics":["python","crawler","scraper","crawling","twisted","scrapy","webcrawler","hacktoberfest","webcrawling","hacktoberfest2021"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":6,"issueCount":24,"starsCount":824,"forksCount":161,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-28T14:25:11.389Z"}},{"type":"Public","name":"portia","owner":"scrapinghub","isFork":false,"description":"Visual scraping for Scrapy","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":19,"issueCount":112,"starsCount":9228,"forksCount":1412,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-26T19:43:46.854Z"}},{"type":"Public","name":"sklearn-crfsuite","owner":"scrapinghub","isFork":true,"description":"scikit-learn inspired API for CRFsuite","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":217,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-18T11:07:35.595Z"}},{"type":"Public","name":"webstruct-demo","owner":"scrapinghub","isFork":false,"description":"HTTP demo for https://github.com/scrapinghub/webstruct","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":0,"starsCount":4,"forksCount":2,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-17T22:51:03.946Z"}},{"type":"Public","name":"autologin","owner":"scrapinghub","isFork":true,"description":"A project to attempt to automatically login to a website given a single seed","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":9,"forksCount":43,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-17T22:40:10.253Z"}},{"type":"Public","name":"python-intercom","owner":"scrapinghub","isFork":true,"description":"Python wrapper for the Intercom API.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":1,"forksCount":145,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-17T21:39:32.494Z"}},{"type":"Public","name":"python-crfsuite","owner":"scrapinghub","isFork":false,"description":"A python binding for crfsuite","allTopics":["data-science","crf","crfsuite"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":6,"issueCount":49,"starsCount":768,"forksCount":223,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-12T21:35:11.761Z"}},{"type":"Public","name":"luigi","owner":"scrapinghub","isFork":true,"description":"Luigi is a Python module that helps you build complex pipelines of batch jobs. It handles dependency resolution, workflow management, visualization etc. It also comes with Hadoop support built in. ","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":4,"forksCount":2377,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-07T00:00:29.945Z"}},{"type":"Public","name":"splash","owner":"scrapinghub","isFork":false,"description":"Lightweight, scriptable browser as a service with an HTTP API","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":25,"issueCount":378,"starsCount":4043,"forksCount":508,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-06T21:52:51.801Z"}},{"type":"Public","name":"mrjob","owner":"scrapinghub","isFork":true,"description":"Run MapReduce jobs on Hadoop or Amazon Web Services","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":0,"forksCount":588,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-06T21:52:15.634Z"}},{"type":"Public","name":"andi","owner":"scrapinghub","isFork":false,"description":"Library for annotation-based dependency injection","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":3,"starsCount":20,"forksCount":5,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-03T12:30:30.745Z"}},{"type":"Public","name":"extruct","owner":"scrapinghub","isFork":false,"description":"Extract embedded metadata from HTML markup","allTopics":["microformats","semantic-web","rdfa","json-ld","microdata","opengraph","hacktoberfest"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":15,"issueCount":38,"starsCount":830,"forksCount":114,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-29T06:50:38.096Z"}},{"type":"Public","name":"docker-custodian","owner":"scrapinghub","isFork":true,"description":"Keep docker hosts tidy","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":0,"forksCount":50,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T08:47:51.591Z"}},{"type":"Public","name":"aduana","owner":"scrapinghub","isFork":false,"description":"Frontera backend to guide a crawl using PageRank, HITS or other ranking algorithms based on the link structure of the web graph, even when making big crawls (one billion pages).","allTopics":["data-science"],"primaryLanguage":{"name":"C","color":"#555555"},"pullRequestCount":2,"issueCount":9,"starsCount":54,"forksCount":8,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T08:44:12.090Z"}},{"type":"Public","name":"exporters","owner":"scrapinghub","isFork":false,"description":"Exporters is an extensible export pipeline library that supports filter, transform and several sources and destinations","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":7,"issueCount":5,"starsCount":40,"forksCount":10,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T08:44:05.979Z"}},{"type":"Public","name":"docker-registry","owner":"scrapinghub","isFork":true,"description":"Registry server for Docker (hosting/delivering of repositories and images)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":1,"forksCount":877,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-20T20:18:28.198Z"}},{"type":"Public","name":"scrapy-monkeylearn","owner":"scrapinghub","isFork":true,"description":"A Scrapy pipeline to categorize items using MonkeyLearn","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":7,"forksCount":13,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-14T22:15:33.084Z"}},{"type":"Public","name":"tutorials","owner":"scrapinghub","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":8,"forksCount":6,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-14T22:15:19.591Z"}},{"type":"Public","name":"custom-images-examples","owner":"scrapinghub","isFork":false,"description":"Examples of custom images running on Scrapinghub platform","allTopics":[],"primaryLanguage":null,"pullRequestCount":1,"issueCount":0,"starsCount":3,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-14T01:33:51.993Z"}}],"repositoryCount":183,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"scrapinghub repositories"}