From 8da67855da0374cdfee1c888fc4ca7aee4b572b8 Mon Sep 17 00:00:00 2001
From: Juan Moises de la Serna
Date: Wed, 1 Apr 2026 04:18:04 +0200
Subject: [PATCH 1/2] Add latamdata-py to Data-centric AI section

---
 README.md | 1 +
 1 file changed, 1 insertion(+)

diff --git a/README.md b/README.md
index fd9f008..de55b14 100644
--- a/README.md
+++ b/README.md
@@ -487,6 +487,7 @@
 * [cleanlab](https://github.com/cleanlab/cleanlab) - The standard data-centric AI package for data quality and machine learning with messy, real-world data and labels.
 * [snorkel](https://github.com/snorkel-team/snorkel) - A system for quickly generating training data with weak supervision.
 * [dataprep](https://github.com/sfu-db/dataprep) - Collect, clean, and visualize your data in Python with a few lines of code.
+* [latamdata-py](https://github.com/juanmoisesd/latamdata-py) - One-line access to 38 open research datasets from Latin America (health, neuroscience, mental health, economics). Real-world data for research and ML.
 
 ### Synthetic Data
 

From 86363bc4b6befe20f206559a7d90cb215a2e6304 Mon Sep 17 00:00:00 2001
From: Juan Moises de la Serna
Date: Wed, 1 Apr 2026 20:44:36 +0200
Subject: [PATCH 2/2] Create check-links.yml

---
 .github/workflows/check-links.yml | 27 +++++++++++++++++++++++++++
 1 file changed, 27 insertions(+)
 create mode 100644 .github/workflows/check-links.yml

diff --git a/.github/workflows/check-links.yml b/.github/workflows/check-links.yml
new file mode 100644
index 0000000..7a2d0c5
--- /dev/null
+++ b/.github/workflows/check-links.yml
@@ -0,0 +1,27 @@
+name: Check for broken links
+on:
+  push:
+    branches: [main, master]
+  pull_request:
+    branches: [main, master]
+  schedule:
+    # Every Monday at 09:00 UTC.
+    - cron: '0 9 * * 1'
+# The job only reads the repository, so restrict the token to read access.
+permissions:
+  contents: read
+jobs:
+  check-links:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - name: Link Checker
+        uses: lycheeverse/lychee-action@v1.8.0
+        with:
+          args: --verbose --max-retries 3 --timeout 10 '**/*.html' '**/*.md'
+          # Fail the job when lychee exits non-zero (broken links found).
+          fail: true
+        env:
+          # lychee reads GITHUB_TOKEN to authenticate github.com requests and
+          # avoid rate-limit (HTTP 429) failures on the README's many links.
+          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}