diff --git a/.github/workflows/check-links.yml b/.github/workflows/check-links.yml
new file mode 100644
--- /dev/null
+++ b/.github/workflows/check-links.yml
@@ -0,0 +1,30 @@
+# Checks the repository's Markdown and HTML files for broken links.
+# Runs on pushes and pull requests targeting main/master, and once a week
+# on a schedule so that links which rot over time are still reported.
+name: Check for broken links
+on:
+  push:
+    branches: [main, master]
+  pull_request:
+    branches: [main, master]
+  schedule:
+    # Every Monday at 09:00 (GitHub evaluates cron schedules in UTC).
+    - cron: '0 9 * * 1'
+# The job only reads the repository, so restrict the token to read access.
+permissions:
+  contents: read
+jobs:
+  check-links:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - name: Link Checker
+        uses: lycheeverse/lychee-action@v1.8.0
+        with:
+          # --no-progress keeps progress-bar output out of the CI log.
+          args: --verbose --no-progress --max-retries 3 --timeout 10 '**/*.html' '**/*.md'
+          fail: true
+        env:
+          # Authenticated requests reduce the risk of GitHub rate limiting
+          # when checking github.com links such as those in README.md.
+          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
diff --git a/README.md b/README.md
index fd9f008..de55b14 100644
--- a/README.md
+++ b/README.md
@@ -487,6 +487,7 @@
 * [cleanlab](https://github.com/cleanlab/cleanlab) - The standard data-centric AI package for data quality and machine learning with messy, real-world data and labels.
 * [snorkel](https://github.com/snorkel-team/snorkel) - A system for quickly generating training data with weak supervision.
 * [dataprep](https://github.com/sfu-db/dataprep) - Collect, clean, and visualize your data in Python with a few lines of code.
+* [latamdata-py](https://github.com/juanmoisesd/latamdata-py) - One-line access to 38 open research datasets from Latin America (health, neuroscience, mental health, economics). Real-world data for research and ML.
 
 ### Synthetic Data
 