{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"oas","owner":"TextCorpusLabs","isFork":false,"description":"Walk through to convert PMC OAS Dataset into a text corpus","allTopics":["python3","oas","text-corpus"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-25T10:29:32.419Z"}},{"type":"Public","name":"Edgar","owner":"TextCorpusLabs","isFork":false,"description":"Create a corpus from EDGAR data","allTopics":["corpus","python3","edgar-scraper"],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-20T17:32:02.655Z"}},{"type":"Public","name":"metadiscourse","owner":"TextCorpusLabs","isFork":false,"description":"Template code for a Metadiscourse analysis","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-16T00:52:41.667Z"}},{"type":"Public","name":"wikimedia","owner":"TextCorpusLabs","isFork":false,"description":"Walk through to convert WikiMedia into a text corpus","allTopics":["wikimedia","python3","text-corpus"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":1,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-01-26T20:31:39.723Z"}},{"type":"Public","name":"VLNGramCounter","owner":"TextCorpusLabs","isFork":false,"description":"NGram counter for large datasets","allTopics":["ngrams","python"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-01-20T13:38:30.059Z"}},{"type":"Public","name":"building-blocks","owner":"TextCorpusLabs","isFork":false,"description":"Building blocks for text pre-processing","allTopics":["python3","text-processing"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-10-05T11:51:11.133Z"}},{"type":"Public","name":"NJGovNews","owner":"TextCorpusLabs","isFork":false,"description":"Web scraping of the New Jersey news feeds","allTopics":["python3","newsfeed","text-corpus"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-03-10T22:43:19.877Z"}},{"type":"Public","name":"congressional-votes","owner":"TextCorpusLabs","isFork":false,"description":"Walk through to convert congressional roll call votes into a text corpus","allTopics":["python3","us-congress","text-corpus","congress-votes"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-01-21T18:02:31.503Z"}},{"type":"Public","name":"getting-started","owner":"TextCorpusLabs","isFork":false,"description":"Getting started at Text Corpus Labs","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-11-19T17:16:07.436Z"}},{"type":"Public","name":"covid19","owner":"TextCorpusLabs","isFork":false,"description":"Walk through to convert Kaggle's COVID-19 Open Research Dataset Challenge into a text corpus","allTopics":["python3","covid-19","text-corpus"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-03-23T21:39:54.321Z"}},{"type":"Public archive","name":"ScrapeSecEdgar","owner":"TextCorpusLabs","isFork":false,"description":"Pulls down all the SEC filings from EDGAR by filing type for a given time range","allTopics":["scraper","edgar"],"primaryLanguage":{"name":"C#","color":"#178600"},"pullRequestCount":0,"issueCount":0,"starsCount":6,"forksCount":0,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-01-18T22:53:23.386Z"}}],"repositoryCount":11,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}