{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"system-metrics","owner":"mediacloud","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-28T23:50:47.665Z"}},{"type":"Public","name":"sous-chef","owner":"mediacloud","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":1,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-27T19:20:50.198Z"}},{"type":"Public","name":"story-indexer","owner":"mediacloud","isFork":false,"description":"The core pipeline used to ingest online news stories in the Media Cloud archive.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":32,"starsCount":1,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-28T12:47:15.871Z"}},{"type":"Public","name":"news-search-api","owner":"mediacloud","isFork":false,"description":"Internal API server that offers search access to the Media Cloud Online News Archive (in Elasticsearch).","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":1,"forksCount":3,"license":"GNU Affero General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-25T22:36:59.947Z"}},{"type":"Public","name":"mc-manage","owner":"mediacloud","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-25T20:35:11.721Z"}},{"type":"Public","name":"rss-fetcher","owner":"mediacloud","isFork":false,"description":"Intelligently fetch lists of URLs from a large collection of RSS Feeds as part of the Media Cloud Directory.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":13,"starsCount":5,"forksCount":5,"license":"Apache License 2.0","participation":[0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,10,0,1,0,0,0,0,0,0,0,0,0,0,0,1,0,8,2,2,0,0,1,5,3,0,1,0,0,0,1,0,1,0,1,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-02T19:27:39.145Z"}},{"type":"Public","name":"mc-providers","owner":"mediacloud","isFork":false,"description":"Internal library to allow querying multiple media platforms with a consistent API.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":0,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-11T13:45:18.070Z"}},{"type":"Public","name":"api-client","owner":"mediacloud","isFork":false,"description":"Public client for consuming content from the Media Cloud Online News Archive & Directory.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":1,"starsCount":67,"forksCount":24,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-07T22:20:57.613Z"}},{"type":"Public","name":"metadata-lib","owner":"mediacloud","isFork":false,"description":"How Media Cloud approaches extracting metadata from online news stories","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":11,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-07T22:00:47.310Z"}},{"type":"Public","name":"mediacloud-news-client","owner":"mediacloud","isFork":true,"description":"An internal client library to access the new Mediacloud news archive search.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":2,"starsCount":0,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-14T20:42:17.369Z"}},{"type":"Public","name":"wayback-news-client","owner":"mediacloud","isFork":false,"description":"A client library to access the Wayback Machine news archive search.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":4,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-15T14:56:17.823Z"}},{"type":"Public archive","name":"backend","owner":"mediacloud","isFork":false,"description":"Media Cloud is an open source, open data platform that allows researchers to answer quantitative questions about the content of online media.","allTopics":["media","newspaper","content-analysis","news-media","newsmedia","online-news"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":25,"issueCount":131,"starsCount":276,"forksCount":87,"license":"GNU Affero General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-20T07:57:58.179Z"}},{"type":"Public","name":"cliff-api-client","owner":"mediacloud","isFork":false,"description":"A Python client for the CLIFF geoparsing tool","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":5,"forksCount":5,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-21T05:31:17.202Z"}},{"type":"Public","name":"ultimate-sitemap-parser","owner":"mediacloud","isFork":false,"description":"Ultimate Website Sitemap Parser","allTopics":["python","sitemap","python3","robots-txt","python-3","xml-sitemap","sitemap-xml","xml-sitemap-parser"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":4,"issueCount":18,"starsCount":173,"forksCount":64,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-05-17T11:16:44.996Z"}},{"type":"Public","name":"nyt-news-labeler","owner":"mediacloud","isFork":false,"description":"Tag news stories based on models trained on the NYT corpus.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":6,"issueCount":1,"starsCount":39,"forksCount":12,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-03-01T18:34:46.754Z"}},{"type":"Public","name":"feed_seeker","owner":"mediacloud","isFork":false,"description":"Find rss, atom, xml, and rdf feeds on webpages","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":4,"starsCount":30,"forksCount":12,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-02-27T06:13:52.547Z"}},{"type":"Public","name":"sentence-splitter","owner":"mediacloud","isFork":false,"description":"Text to sentence splitter using heuristic algorithm by Philipp Koehn and Josh Schroeder.","allTopics":["nlp","tokenizer","sentence-splitting"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":2,"starsCount":221,"forksCount":29,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-11-07T22:32:41.511Z"}},{"type":"Public archive","name":"glimpse","owner":"mediacloud","isFork":false,"description":"Get a glimpse of attention to a topic on social media.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":8,"starsCount":2,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-09-19T13:01:39.422Z"}},{"type":"Public archive","name":"word-embeddings-server","owner":"mediacloud","isFork":false,"description":"Helpful micro-service to return results from word2vec models","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":4,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-07-29T15:37:22.842Z"}},{"type":"Public archive","name":"fernandos-smart-status-aggregator","owner":"mediacloud","isFork":false,"description":"Check SMART status with smartctl on multiple servers, get an aggregate CSV, ???, profit!","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-09-02T11:50:26.274Z"}},{"type":"Public","name":"nytlabels-annotator-train","owner":"mediacloud","isFork":true,"description":"(Probably) NYTLabels annotator training scripts and data.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":2,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-12-07T19:57:27.707Z"}},{"type":"Public","name":"corenlp-docker","owner":"mediacloud","isFork":true,"description":"build/run the most current Stanford CoreNLP server in a docker container","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":31,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-11-20T10:39:46.185Z"}},{"type":"Public","name":"docker-compose-just-quieter","owner":"mediacloud","isFork":false,"description":"Docker Compose CLI utility wrapper which makes `docker-compose` quieter.","allTopics":["docker","docker-compose"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-09-08T19:34:56.086Z"}},{"type":"Public","name":"fernandos-csv-randomizer","owner":"mediacloud","isFork":false,"description":"Fernando's CSV randomizer -- reads a CSV file, picks a specified number of random rows and writes them to a separate file","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-09-08T19:01:34.717Z"}},{"type":"Public","name":"topic2kibana","owner":"mediacloud","isFork":false,"description":"This is a simple utility for automating the import of content from a Media Cloud topic version into Kibana for analysis.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-06-16T20:09:59.897Z"}},{"type":"Public","name":"date_guesser","owner":"mediacloud","isFork":false,"description":"A library to extract a publication date from a web page, along with a measure of the accuracy.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":42,"forksCount":7,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-08-13T16:09:29.172Z"}},{"type":"Public","name":"hausastemmer","owner":"mediacloud","isFork":false,"description":"Hausa language stemmer (Bimba et al., 2015)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2017-09-07T13:36:53.195Z"}}],"repositoryCount":27,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}