{"payload":{"pageCount":7,"repositories":[{"type":"Public","name":"shub-workflow","owner":"scrapinghub","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":2,"starsCount":13,"forksCount":13,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-29T18:36:40.869Z"}},{"type":"Public","name":"extruct","owner":"scrapinghub","isFork":false,"description":"Extract embedded metadata from HTML markup","allTopics":["microformats","semantic-web","rdfa","json-ld","microdata","opengraph","hacktoberfest"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":15,"issueCount":38,"starsCount":828,"forksCount":114,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-29T06:50:38.096Z"}},{"type":"Public","name":"scrapy-poet","owner":"scrapinghub","isFork":false,"description":"Page Object pattern for Scrapy","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":5,"issueCount":9,"starsCount":112,"forksCount":28,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-27T13:42:33.443Z"}},{"type":"Public","name":"docker-custodian","owner":"scrapinghub","isFork":true,"description":"Keep docker hosts tidy","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":0,"forksCount":50,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T08:47:51.591Z"}},{"type":"Public","name":"python-intercom","owner":"scrapinghub","isFork":true,"description":"Python wrapper for the Intercom API.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":1,"forksCount":144,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T08:44:32.585Z"}},{"type":"Public","name":"aduana","owner":"scrapinghub","isFork":false,"description":"Frontera backend to guide a crawl using PageRank, HITS or other ranking algorithms based on the link structure of the web graph, even when making big crawls (one billion pages).","allTopics":["data-science"],"primaryLanguage":{"name":"C","color":"#555555"},"pullRequestCount":2,"issueCount":9,"starsCount":53,"forksCount":8,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T08:44:12.090Z"}},{"type":"Public","name":"exporters","owner":"scrapinghub","isFork":false,"description":"Exporters is an extensible export pipeline library that supports filter, transform and several sources and destinations","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":7,"issueCount":5,"starsCount":40,"forksCount":10,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T08:44:05.979Z"}},{"type":"Public","name":"scrapinghub-stack-scrapy","owner":"scrapinghub","isFork":false,"description":"Software stack with latest Scrapy and updated deps","allTopics":[],"primaryLanguage":{"name":"Dockerfile","color":"#384d54"},"pullRequestCount":3,"issueCount":1,"starsCount":62,"forksCount":23,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T05:58:31.528Z"}},{"type":"Public","name":"webstruct-demo","owner":"scrapinghub","isFork":false,"description":"HTTP demo for https://github.com/scrapinghub/webstruct","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":0,"starsCount":4,"forksCount":2,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-20T21:10:34.433Z"}},{"type":"Public","name":"autologin","owner":"scrapinghub","isFork":true,"description":"A project to attempt to automatically login to a website given a single seed","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":8,"forksCount":43,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-20T20:22:33.246Z"}},{"type":"Public","name":"docker-registry","owner":"scrapinghub","isFork":true,"description":"Registry server for Docker (hosting/delivering of repositories and images)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":1,"forksCount":875,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-20T20:18:28.198Z"}},{"type":"Public","name":"spidermon","owner":"scrapinghub","isFork":false,"description":"Scrapy Extension for monitoring spiders execution.","allTopics":["testing","monitoring","scraping","crawling","spiders","hacktoberfest","monitoring-tool","scrapinghub"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":7,"issueCount":38,"starsCount":515,"forksCount":92,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":[0,0,0,2,4,0,2,0,0,4,0,0,9,1,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,1,0,0,4,0,0,0,0,0,2,1,0,6,1,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-16T12:22:07.085Z"}},{"type":"Public","name":"portia","owner":"scrapinghub","isFork":false,"description":"Visual scraping for Scrapy","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":18,"issueCount":112,"starsCount":9205,"forksCount":1410,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-14T22:19:52.320Z"}},{"type":"Public","name":"shublang","owner":"scrapinghub","isFork":false,"description":"Pluggable DSL that uses pipes to perform a series of linear transformations to extract data","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":6,"issueCount":23,"starsCount":15,"forksCount":8,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-14T22:16:36.110Z"}},{"type":"Public","name":"scrapy-monkeylearn","owner":"scrapinghub","isFork":true,"description":"A Scrapy pipeline to categorize items using MonkeyLearn","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":7,"forksCount":13,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-14T22:15:33.084Z"}},{"type":"Public","name":"tutorials","owner":"scrapinghub","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":7,"forksCount":6,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-14T22:15:19.591Z"}},{"type":"Public","name":"custom-images-examples","owner":"scrapinghub","isFork":false,"description":"Examples of custom images running on Scrapinghub platform","allTopics":[],"primaryLanguage":null,"pullRequestCount":1,"issueCount":0,"starsCount":3,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-14T01:33:51.993Z"}},{"type":"Public","name":"number-parser","owner":"scrapinghub","isFork":false,"description":"Parse numbers written in natural language","allTopics":["hacktoberfest"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":6,"issueCount":13,"starsCount":103,"forksCount":22,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-13T13:44:08.109Z"}},{"type":"Public","name":"mrjob","owner":"scrapinghub","isFork":true,"description":"Run MapReduce jobs on Hadoop or Amazon Web Services","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":0,"forksCount":591,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-06T16:58:21.666Z"}},{"type":"Public","name":"pastebin","owner":"scrapinghub","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":7,"forksCount":3,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-06T15:44:06.978Z"}},{"type":"Public","name":"woodpecker","owner":"scrapinghub","isFork":true,"description":"An opinionated fork of the Drone CI system","allTopics":[],"primaryLanguage":{"name":"Go","color":"#00ADD8"},"pullRequestCount":4,"issueCount":0,"starsCount":0,"forksCount":332,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-06T15:25:48.219Z"}},{"type":"Public","name":"Zappa","owner":"scrapinghub","isFork":true,"description":"Serverless Python Web Services","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":3,"forksCount":1207,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-06T14:35:42.245Z"}},{"type":"Public","name":"shub","owner":"scrapinghub","isFork":false,"description":"Scrapinghub Command Line Client","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":14,"issueCount":44,"starsCount":125,"forksCount":79,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-03T20:09:59.645Z"}},{"type":"Public","name":"webstruct","owner":"scrapinghub","isFork":false,"description":"NER toolkit for HTML data","allTopics":["data-science","ner","crfsuite"],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":10,"issueCount":13,"starsCount":255,"forksCount":59,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-03T19:37:19.901Z"}},{"type":"Public","name":"varanus","owner":"scrapinghub","isFork":false,"description":"A command line spider monitoring tool","allTopics":["spider","monitoring","python36"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":2,"starsCount":7,"forksCount":6,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-01T14:34:22.771Z"}},{"type":"Public","name":"product-extraction-benchmark","owner":"scrapinghub","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":16,"forksCount":1,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-24T09:58:12.207Z"}},{"type":"Public","name":"article-extraction-benchmark","owner":"scrapinghub","isFork":false,"description":"Article extraction benchmark: dataset and evaluation scripts","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":255,"forksCount":28,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-24T09:57:59.039Z"}},{"type":"Public","name":"autoextract-examples","owner":"scrapinghub","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":4,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-24T09:57:44.636Z"}},{"type":"Public","name":"spark","owner":"scrapinghub","isFork":true,"description":"Mirror of Apache Spark","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":1,"issueCount":0,"starsCount":1,"forksCount":28000,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-24T09:09:22.924Z"}},{"type":"Public","name":"tabix","owner":"scrapinghub","isFork":true,"description":"Tabix.io UI","allTopics":[],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":1,"issueCount":0,"starsCount":1,"forksCount":264,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-24T09:07:43.746Z"}}],"repositoryCount":182,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}