From 672c258f59039ae5714361571609a07168fbb14f Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Fri, 22 Sep 2023 20:19:20 +0530 Subject: [PATCH 01/49] Create broken-linkcheck.yml Created a Github Action to run the Sphinx linkcheck monthly. #45409 --- .github/workflows/broken-linkcheck.yml | 28 ++++++++++++++++++++++++++ 1 file changed, 28 insertions(+) create mode 100644 .github/workflows/broken-linkcheck.yml diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml new file mode 100644 index 0000000000000..9075e8d13afcd --- /dev/null +++ b/.github/workflows/broken-linkcheck.yml @@ -0,0 +1,28 @@ +name: Broken linkcheck +on: + schedule: + # Run monthly on the 1st day of the month + - cron: '0 0 1 * *' +jobs: + linkcheck: + runs-on: ubuntu-latest + + steps: + - name: Checkout + uses: actions/checkout@v4 + with: + fetch-depth: 0 + + - name: Setup Python + id: setup_python + uses: actions/setup-python@v4 + with: + python-version: '3.10' + cache: 'pip' + cache-dependency-path: 'requirements-dev.txt' + + - name: Install requirements-dev.txt + run: pip install -r requirements-dev.txt + + - name: Run linkcheck script + run: python make.py linkcheck From f355cdff8e50ad144994c3831f2328c4953c23b9 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Sat, 23 Sep 2023 11:49:47 +0530 Subject: [PATCH 02/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 9075e8d13afcd..b65d5c9277b59 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -1,8 +1,9 @@ name: Broken linkcheck on: - schedule: + workflow_dispatch: # Enable manual triggering + #schedule: # Run monthly on the 1st day of the month - - cron: '0 0 1 * *' + #- cron: '0 0 1 * *' jobs: linkcheck: runs-on: ubuntu-latest From a8fc4bd5774cfb56ba0bd1f58637f761e034275c Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Sat, 23 Sep 2023 12:46:55 +0530 Subject: [PATCH 03/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index b65d5c9277b59..9c430df6844d2 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -1,3 +1,4 @@ +--- name: Broken linkcheck on: workflow_dispatch: # Enable manual triggering From d7d9ba0ef62297e95169b39e951c86daa0805969 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Sat, 23 Sep 2023 14:53:42 +0530 Subject: [PATCH 04/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 9c430df6844d2..52ad6063dfd41 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -17,7 +17,7 @@ jobs: - name: Setup Python id: setup_python - uses: actions/setup-python@v4 + uses: actions/setup-python@v4 with: python-version: '3.10' cache: 'pip' @@ -27,4 +27,4 @@ jobs: run: pip install -r requirements-dev.txt - name: Run linkcheck script - run: python make.py linkcheck + run: python make.py linkcheck From 53f7a2e4dab35650c041f85e4fc193e7597b1fda Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Sat, 23 Sep 2023 20:55:29 +0530 Subject: [PATCH 05/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 52ad6063dfd41..04ba8f05d7713 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -8,12 +8,12 @@ on: jobs: linkcheck: runs-on: ubuntu-latest - + steps: - name: Checkout uses: actions/checkout@v4 with: - fetch-depth: 0 + fetch-depth: 0 - name: Setup Python id: setup_python From 6987819c8eaa5cc30ae420a8ea5df510bbde6548 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Sat, 23 Sep 2023 23:34:39 +0530 Subject: [PATCH 06/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 04ba8f05d7713..966384792a5de 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -4,7 +4,7 @@ on: workflow_dispatch: # Enable manual triggering #schedule: # Run monthly on the 1st day of the month - #- cron: '0 0 1 * *' + #- cron: '0 0 1 * *' jobs: linkcheck: runs-on: ubuntu-latest @@ -13,7 +13,7 @@ jobs: - name: Checkout uses: actions/checkout@v4 with: - fetch-depth: 0 + fetch-depth: 0 - name: Setup Python id: setup_python @@ -24,7 +24,7 @@ jobs: cache-dependency-path: 'requirements-dev.txt' - name: Install requirements-dev.txt - run: pip install -r requirements-dev.txt + run: pip install -r requirements-dev.txt - name: Run linkcheck script run: python make.py linkcheck From 2d15e1fae5494422ebd3131d775da7bf2e472ecf Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Mon, 25 Sep 2023 15:54:53 +0530 Subject: [PATCH 07/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Philip Meier --- .github/workflows/broken-linkcheck.yml | 1 - 1 file changed, 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 966384792a5de..e2e9550099df1 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -1,4 +1,3 @@ ---- name: Broken linkcheck on: workflow_dispatch: # Enable manual triggering From 4e4061100c686caca17068462fcc184a50a04f36 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Mon, 25 Sep 2023 15:55:25 +0530 Subject: [PATCH 08/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Philip Meier --- .github/workflows/broken-linkcheck.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index e2e9550099df1..9a9ee65363e08 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -1,4 +1,4 @@ -name: Broken linkcheck +name: Linkcheck on: workflow_dispatch: # Enable manual triggering #schedule: From d486c3ea25662f7111e174aa8e41e88b7c296fc8 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Mon, 25 Sep 2023 15:58:09 +0530 Subject: [PATCH 09/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Philip Meier --- .github/workflows/broken-linkcheck.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 9a9ee65363e08..36fa9c60cdcd6 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -26,4 +26,5 @@ jobs: run: pip install -r requirements-dev.txt - name: Run linkcheck script + working-directory: ./doc run: python make.py linkcheck From 69eaa34046611fe981c53b831a691dd65df5cf21 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Mon, 25 Sep 2023 16:00:27 +0530 Subject: [PATCH 10/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Philip Meier --- .github/workflows/broken-linkcheck.yml | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 36fa9c60cdcd6..9f84f5e6ce0f2 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -4,6 +4,10 @@ on: #schedule: # Run monthly on the 1st day of the month #- cron: '0 0 1 * *' + pull_request: + paths: + - ".github/workflows/broken-linkcheck.yml" + - "doc/make.py" jobs: linkcheck: runs-on: ubuntu-latest From 86b7c9cec44dd453aee33a9301fc6713f568a258 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Mon, 25 Sep 2023 16:08:00 +0530 Subject: [PATCH 11/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 9f84f5e6ce0f2..172b461eaf609 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -7,7 +7,7 @@ on: pull_request: paths: - ".github/workflows/broken-linkcheck.yml" - - "doc/make.py" + - "doc/make.py" jobs: linkcheck: runs-on: ubuntu-latest From a037a9bb42d0921d66f287e3453771866cb5f685 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Mon, 25 Sep 2023 19:49:14 +0530 Subject: [PATCH 12/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 172b461eaf609..36b971daf12a4 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -17,6 +17,12 @@ jobs: uses: actions/checkout@v4 with: fetch-depth: 0 + + - name: Set up Conda + uses: ./.github/actions/setup-conda + + - name: Build Pandas + uses: ./.github/actions/build_pandas - name: Setup Python id: setup_python From fc821e54244d15c94eef8176ae74928d6c5e6268 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Mon, 25 Sep 2023 20:01:43 +0530 Subject: [PATCH 13/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 36b971daf12a4..80c3ee017a9c8 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -17,7 +17,7 @@ jobs: uses: actions/checkout@v4 with: fetch-depth: 0 - + - name: Set up Conda uses: ./.github/actions/setup-conda From a902099e533988059ad61f25f9e1fc9007372903 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Mon, 25 Sep 2023 21:06:34 +0530 Subject: [PATCH 14/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Philip Meier --- .github/workflows/broken-linkcheck.yml | 10 ---------- 1 file changed, 10 deletions(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 80c3ee017a9c8..dddaf87083619 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -24,16 +24,6 @@ jobs: - name: Build Pandas uses: ./.github/actions/build_pandas - - name: Setup Python - id: setup_python - uses: actions/setup-python@v4 - with: - python-version: '3.10' - cache: 'pip' - cache-dependency-path: 'requirements-dev.txt' - - - name: Install requirements-dev.txt - run: pip install -r requirements-dev.txt - name: Run linkcheck script working-directory: ./doc From 8484c630aa685b7d03094dca0834a1785a910e11 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Tue, 26 Sep 2023 19:50:01 +0530 Subject: [PATCH 15/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 3 +++ 1 file changed, 3 insertions(+) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index dddaf87083619..2d783963bd21a 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -11,6 +11,9 @@ on: jobs: linkcheck: runs-on: ubuntu-latest + defaults: + run: + shell: bash -el {0} steps: - name: Checkout From d56f2c55c6452b239f26c6cafe4ebefaa96e35b8 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 28 Sep 2023 15:17:01 +0530 Subject: [PATCH 16/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Philip Meier --- .github/workflows/broken-linkcheck.yml | 1 - 1 file changed, 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 2d783963bd21a..2b0b3e72e2cf2 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -27,7 +27,6 @@ jobs: - name: Build Pandas uses: ./.github/actions/build_pandas - - name: Run linkcheck script working-directory: ./doc run: python make.py linkcheck From b50eea26bf69b8738b440668ea1c4237b2f88c04 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 28 Sep 2023 15:34:14 +0530 Subject: [PATCH 17/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Philip Meier --- .github/workflows/broken-linkcheck.yml | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 2b0b3e72e2cf2..2a013aab3cc5a 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -29,4 +29,9 @@ jobs: - name: Run linkcheck script working-directory: ./doc - run: python make.py linkcheck + run: python make.py linkcheck | tee linkcheck.txt + + - name: Display broken links + if: failure() + working-directory: ./doc + run: grep broken linkcheck.txt From 60f16551e38ff64a483a4663ce99da88829bc4a4 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 28 Sep 2023 15:37:47 +0530 Subject: [PATCH 18/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 2a013aab3cc5a..5e08d499d53ea 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -34,4 +34,4 @@ jobs: - name: Display broken links if: failure() working-directory: ./doc - run: grep broken linkcheck.txt + run: grep -i broken linkcheck.txt From 3a35cd65dd0bf1d29e86ad161f43eeaa2879d0cf Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 28 Sep 2023 15:50:46 +0530 Subject: [PATCH 19/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 5e08d499d53ea..58d470312e86f 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -30,8 +30,8 @@ jobs: - name: Run linkcheck script working-directory: ./doc run: python make.py linkcheck | tee linkcheck.txt - + - name: Display broken links if: failure() working-directory: ./doc - run: grep -i broken linkcheck.txt + run: linkcheck.txt grep -i broken From a60215341f6a244e56627d4832e90018a191ae5e Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 28 Sep 2023 20:54:00 +0530 Subject: [PATCH 20/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Philip Meier --- .github/workflows/broken-linkcheck.yml | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 58d470312e86f..141fb7984afa3 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -29,7 +29,10 @@ jobs: - name: Run linkcheck script working-directory: ./doc - run: python make.py linkcheck | tee linkcheck.txt + shell: bash + run: | + set -o pipefail + python make.py linkcheck | tee linkcheck.txt - name: Display broken links if: failure() From ef26ad7b73a59020a0ab679df1380b19b0da728f Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Fri, 29 Sep 2023 15:20:40 +0530 Subject: [PATCH 21/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 141fb7984afa3..acac867245aa3 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -1,9 +1,10 @@ name: Linkcheck on: - workflow_dispatch: # Enable manual triggering - #schedule: + workflow_dispatch: + # Enable manual triggering + schedule: # Run monthly on the 1st day of the month - #- cron: '0 0 1 * *' + - cron: '0 0 1 * *' pull_request: paths: - ".github/workflows/broken-linkcheck.yml" @@ -37,4 +38,4 @@ jobs: - name: Display broken links if: failure() working-directory: ./doc - run: linkcheck.txt grep -i broken + run: grep broken linkcheck.txt From 55afa65d9f07d81e317086cd26410373d09118c9 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 5 Oct 2023 19:37:38 +0530 Subject: [PATCH 22/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Philip Meier --- .github/workflows/broken-linkcheck.yml | 1 - 1 file changed, 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index acac867245aa3..067bcda7a2eb2 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -30,7 +30,6 @@ jobs: - name: Run linkcheck script working-directory: ./doc - shell: bash run: | set -o pipefail python make.py linkcheck | tee linkcheck.txt From 84fe04c39fe30eac25df9dc658e1d2b8197c5b07 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Tue, 10 Oct 2023 19:25:14 +0530 Subject: [PATCH 23/49] Update conf.py Added Ignore list for broken link checks --- doc/source/conf.py | 32 ++++++++++++++++++++++++++++++++ 1 file changed, 32 insertions(+) diff --git a/doc/source/conf.py b/doc/source/conf.py index accbff596b12d..ff993a5bc9dd8 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -798,3 +798,35 @@ def setup(app): app.add_autodocumenter(AccessorMethodDocumenter) app.add_autodocumenter(AccessorCallableDocumenter) app.add_directive("autosummary", PandasAutosummary) + + +#### Ignore list for broken link checks + +import re +import requests + +# Fetch the content of the ci file +pipeline_url = ("https://pipelinesghubeus22.actions.githubusercontent.com/" + "xZyE9jtmkxWlfCAbyu1SHPJOlsa2huNFYcxohSTomy6EbdNZT9/" + "_apis/pipelines/1/runs/531865/signedlogcontent/2?" + "urlExpires=2023-10-08T10%3A02%3A18.0563894Z&" + "urlSigningMethod=HMACV1&" + "urlSignature=9icPkVbCE2Ya0M5%2FY03N8fkFuDfYBn%2F" + "DyJ93o2R4%2BWk%3D") + +response = requests.get(pipeline_url) +ignore_patterns = response.text.splitlines() + +# List to store broken links +broken_links = [] + +# Ignore links based on patterns from ci file +for pattern in ignore_patterns: + # Compile the regular expression pattern + regex_pattern = re.compile(pattern) + + # Check if any broken link matches the pattern + ignored_links = [link for link in broken_links if regex_pattern.search(link)] + + print(f"Ignored links matching pattern {pattern}:") + print(ignored_links) From 11935673fa3f0bd76366bcb1aa001215c0349b1f Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 12 Oct 2023 21:47:48 +0530 Subject: [PATCH 24/49] Update conf.py #55246 This is an ignore list for broken links found in CI run checks for broken-linkcheck.yml --- doc/source/conf.py | 65 +++++++++++++++++++++++++--------------------- 1 file changed, 35 insertions(+), 30 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index ff993a5bc9dd8..3cb90890f5677 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -800,33 +800,38 @@ def setup(app): app.add_directive("autosummary", PandasAutosummary) -#### Ignore list for broken link checks - -import re -import requests - -# Fetch the content of the ci file -pipeline_url = ("https://pipelinesghubeus22.actions.githubusercontent.com/" - "xZyE9jtmkxWlfCAbyu1SHPJOlsa2huNFYcxohSTomy6EbdNZT9/" - "_apis/pipelines/1/runs/531865/signedlogcontent/2?" - "urlExpires=2023-10-08T10%3A02%3A18.0563894Z&" - "urlSigningMethod=HMACV1&" - "urlSignature=9icPkVbCE2Ya0M5%2FY03N8fkFuDfYBn%2F" - "DyJ93o2R4%2BWk%3D") - -response = requests.get(pipeline_url) -ignore_patterns = response.text.splitlines() - -# List to store broken links -broken_links = [] - -# Ignore links based on patterns from ci file -for pattern in ignore_patterns: - # Compile the regular expression pattern - regex_pattern = re.compile(pattern) - - # Check if any broken link matches the pattern - ignored_links = [link for link in broken_links if regex_pattern.search(link)] - - print(f"Ignored links matching pattern {pattern}:") - print(ignored_links) +####### This is an ignore list for broken links found in CI run checks for broken-linkcheck.yml + +linkcheck_ignore = [r'http://'] +linkcheck_ignore = [r'http://scatterci.github.io/pydata/pandas:\d+/'] +linkcheck_ignore = [r'http://specs.frictionlessdata.io/json-table-schema/:\d+/'] +linkcheck_ignore = [r'https://'] +linkcheck_ignore = [r'https://cloud.google.com/bigquery/docs/access-control#roles:\d+/'] +linkcheck_ignore = [r'https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query:\d+/'] +linkcheck_ignore = [r'https://crates.io/crates/calamine:\d+/'] +linkcheck_ignore = [r'https://devguide.python.org/setup/#macos:\d+/'] +linkcheck_ignore = [r'https://en.wikipedia.org/wiki/Imputation_(statistics:\d+/'] +linkcheck_ignore = [r'https://github.com/noatamir/pandas-dev:\d+/'] +linkcheck_ignore = [r'https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1:\d+/'] +linkcheck_ignore = [r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568:\d+/'] +linkcheck_ignore = [r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495:\d+/'] +linkcheck_ignore = [r'https://github.com/pandas-dev/pandas/issues/174151:\d+/'] +linkcheck_ignore = [r'https://gitpod.io/#https://github.com/USERNAME/pandas:\d+/'] +linkcheck_ignore = [r'https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/:\d+/'] +linkcheck_ignore = [r'https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table:\d+/'] +linkcheck_ignore = [r'https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html:\d+/'] +linkcheck_ignore = [r'https://nbviewer.ipython.org/gist/metakermit/5720498:\d+/'] +linkcheck_ignore = [r'https://numpy.org/doc/stable/user/basics.byteswapping.html:\d+/'] +linkcheck_ignore = [r'https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0:\d+/'] +linkcheck_ignore = [r'https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking:\d+/'] +linkcheck_ignore = [r'https://pandas.pydata.org/pandas-docs/stable/ecosystem.html:\d+/'] +linkcheck_ignore = [r'https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html:\d+/'] +linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm:\d+/'] +linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm:\d+/'] +linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm:\d+/'] +linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm:\d+/'] +linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm:\d+/'] +linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm:\d+/'] +linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm:\d+/'] +linkcheck_ignore = [r'https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/:\d+/'] +linkcheck_ignore = [r'pandas.zip:\d+/'] From b54a6eb9c064c2d76924f2a35fabf36226994df1 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Fri, 13 Oct 2023 00:47:41 +0530 Subject: [PATCH 25/49] Update doc/source/conf.py Co-authored-by: Philip Meier --- doc/source/conf.py | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 3cb90890f5677..a055e36acad64 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -802,8 +802,11 @@ def setup(app): ####### This is an ignore list for broken links found in CI run checks for broken-linkcheck.yml -linkcheck_ignore = [r'http://'] -linkcheck_ignore = [r'http://scatterci.github.io/pydata/pandas:\d+/'] +linkcheck_ignore = [ + r'http://', + r'http://scatterci.github.io/pydata/pandas:\d+/' + ... +] linkcheck_ignore = [r'http://specs.frictionlessdata.io/json-table-schema/:\d+/'] linkcheck_ignore = [r'https://'] linkcheck_ignore = [r'https://cloud.google.com/bigquery/docs/access-control#roles:\d+/'] From 787642dbc43fedd8685b5326898b6471f7f1dfd1 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Fri, 13 Oct 2023 01:04:43 +0530 Subject: [PATCH 26/49] Update conf.py --- doc/source/conf.py | 65 +++++++++++++++++++++++----------------------- 1 file changed, 32 insertions(+), 33 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index a055e36acad64..64d421d1c9dea 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -804,37 +804,36 @@ def setup(app): linkcheck_ignore = [ r'http://', - r'http://scatterci.github.io/pydata/pandas:\d+/' - ... + r'http://scatterci.github.io/pydata/pandas', + r'http://specs.frictionlessdata.io/json-table-schema/', + r'https://', + r'https://cloud.google.com/bigquery/docs/access-control#roles', + r'https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query', + r'https://crates.io/crates/calamine', + r'https://devguide.python.org/setup/#macos', + r'https://en.wikipedia.org/wiki/Imputation_(statistics', + r'https://github.com/noatamir/pandas-dev', + r'https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1', + r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568', + r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495', + r'https://github.com/pandas-dev/pandas/issues/174151', + r'https://gitpod.io/#https://github.com/USERNAME/pandas', + r'https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/', + r'https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table', + r'https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html', + r'https://nbviewer.ipython.org/gist/metakermit/5720498', + r'https://numpy.org/doc/stable/user/basics.byteswapping.html', + r'https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0', + r'https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking', + r'https://pandas.pydata.org/pandas-docs/stable/ecosystem.html', + r'https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html', + r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm', + r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm', + r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm', + r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm', + r'https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm', + r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm', + r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm', + r'https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/', + r'pandas.zip' ] -linkcheck_ignore = [r'http://specs.frictionlessdata.io/json-table-schema/:\d+/'] -linkcheck_ignore = [r'https://'] -linkcheck_ignore = [r'https://cloud.google.com/bigquery/docs/access-control#roles:\d+/'] -linkcheck_ignore = [r'https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query:\d+/'] -linkcheck_ignore = [r'https://crates.io/crates/calamine:\d+/'] -linkcheck_ignore = [r'https://devguide.python.org/setup/#macos:\d+/'] -linkcheck_ignore = [r'https://en.wikipedia.org/wiki/Imputation_(statistics:\d+/'] -linkcheck_ignore = [r'https://github.com/noatamir/pandas-dev:\d+/'] -linkcheck_ignore = [r'https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1:\d+/'] -linkcheck_ignore = [r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568:\d+/'] -linkcheck_ignore = [r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495:\d+/'] -linkcheck_ignore = [r'https://github.com/pandas-dev/pandas/issues/174151:\d+/'] -linkcheck_ignore = [r'https://gitpod.io/#https://github.com/USERNAME/pandas:\d+/'] -linkcheck_ignore = [r'https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/:\d+/'] -linkcheck_ignore = [r'https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table:\d+/'] -linkcheck_ignore = [r'https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html:\d+/'] -linkcheck_ignore = [r'https://nbviewer.ipython.org/gist/metakermit/5720498:\d+/'] -linkcheck_ignore = [r'https://numpy.org/doc/stable/user/basics.byteswapping.html:\d+/'] -linkcheck_ignore = [r'https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0:\d+/'] -linkcheck_ignore = [r'https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking:\d+/'] -linkcheck_ignore = [r'https://pandas.pydata.org/pandas-docs/stable/ecosystem.html:\d+/'] -linkcheck_ignore = [r'https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html:\d+/'] -linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm:\d+/'] -linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm:\d+/'] -linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm:\d+/'] -linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm:\d+/'] -linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm:\d+/'] -linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm:\d+/'] -linkcheck_ignore = [r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm:\d+/'] -linkcheck_ignore = [r'https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/:\d+/'] -linkcheck_ignore = [r'pandas.zip:\d+/'] From 84f5dc4bfa7fc638f3c5e28cff8b0ef9618e4fc8 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Fri, 13 Oct 2023 01:39:01 +0530 Subject: [PATCH 27/49] Update conf.py --- doc/source/conf.py | 66 +++++++++++++++++++++++----------------------- 1 file changed, 33 insertions(+), 33 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 64d421d1c9dea..0ac6fed919ab2 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -803,37 +803,37 @@ def setup(app): ####### This is an ignore list for broken links found in CI run checks for broken-linkcheck.yml linkcheck_ignore = [ - r'http://', - r'http://scatterci.github.io/pydata/pandas', - r'http://specs.frictionlessdata.io/json-table-schema/', - r'https://', - r'https://cloud.google.com/bigquery/docs/access-control#roles', - r'https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query', - r'https://crates.io/crates/calamine', - r'https://devguide.python.org/setup/#macos', - r'https://en.wikipedia.org/wiki/Imputation_(statistics', - r'https://github.com/noatamir/pandas-dev', - r'https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1', - r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568', - r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495', - r'https://github.com/pandas-dev/pandas/issues/174151', - r'https://gitpod.io/#https://github.com/USERNAME/pandas', - r'https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/', - r'https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table', - r'https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html', - r'https://nbviewer.ipython.org/gist/metakermit/5720498', - r'https://numpy.org/doc/stable/user/basics.byteswapping.html', - r'https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0', - r'https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking', - r'https://pandas.pydata.org/pandas-docs/stable/ecosystem.html', - r'https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html', - r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm', - r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm', - r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm', - r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm', - r'https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm', - r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm', - r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm', - r'https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/', - r'pandas.zip' + re.escape(r'http://'), + re.escape((r'http://scatterci.github.io/pydata/pandas'), + re.escape(r'http://specs.frictionlessdata.io/json-table-schema/'), + re.escape(r'https://'), + re.escape(r'https://cloud.google.com/bigquery/docs/access-control#roles'), + re.escape((r'https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query'), + re.escape(r'https://crates.io/crates/calamine'), + re.escape(r'https://devguide.python.org/setup/#macos'), + re.escape(r'https://en.wikipedia.org/wiki/Imputation_(statistics'), + re.escape(r'https://github.com/noatamir/pandas-dev'), + re.escape(r'https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1'), + re.escape(r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568'), + re.escape(r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495'), + re.escape(r'https://github.com/pandas-dev/pandas/issues/174151'), + re.escape(r'https://gitpod.io/#https://github.com/USERNAME/pandas'), + re.escape(r'https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/'), + re.escape(r'https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table'), + re.escape(r'https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html'), + re.escape(r'https://nbviewer.ipython.org/gist/metakermit/5720498'), + re.escape(r'https://numpy.org/doc/stable/user/basics.byteswapping.html'), + re.escape(r'https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0'), + re.escape(r'https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking'), + re.escape(r'https://pandas.pydata.org/pandas-docs/stable/ecosystem.html'), + re.escape(r'https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html'), + re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm'), + re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm'), + re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm'), + re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm'), + re.escape(r'https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm'), + re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm'), + re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm'), + re.escape(r'https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/'), + re.escape(r'pandas.zip') ] From 5d7bbf0d3c35242930430a9fcd06e555b561f08c Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Fri, 13 Oct 2023 13:19:48 +0530 Subject: [PATCH 28/49] Update conf.py --- doc/source/conf.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 0ac6fed919ab2..d77ea07b7e2a9 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -804,11 +804,11 @@ def setup(app): linkcheck_ignore = [ re.escape(r'http://'), - re.escape((r'http://scatterci.github.io/pydata/pandas'), + re.escape(r'http://scatterci.github.io/pydata/pandas'), re.escape(r'http://specs.frictionlessdata.io/json-table-schema/'), re.escape(r'https://'), re.escape(r'https://cloud.google.com/bigquery/docs/access-control#roles'), - re.escape((r'https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query'), + re.escape(r'https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query'), re.escape(r'https://crates.io/crates/calamine'), re.escape(r'https://devguide.python.org/setup/#macos'), re.escape(r'https://en.wikipedia.org/wiki/Imputation_(statistics'), From bf443a6ac5de790472a3999e9191a1316db5c049 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Fri, 13 Oct 2023 15:49:26 +0530 Subject: [PATCH 29/49] Update conf.py --- doc/source/conf.py | 1 + 1 file changed, 1 insertion(+) diff --git a/doc/source/conf.py b/doc/source/conf.py index d77ea07b7e2a9..2cbe79428e1cf 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -16,6 +16,7 @@ import os import sys import warnings +import re import jinja2 from numpydoc.docscrape import NumpyDocString From cd90793cef9466d7ef1159d38452fdc82df90ccc Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Fri, 13 Oct 2023 17:02:05 +0530 Subject: [PATCH 30/49] Update conf.py --- doc/source/conf.py | 66 +++++++++++++++++++++++----------------------- 1 file changed, 33 insertions(+), 33 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 2cbe79428e1cf..f113cb9a7b158 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -804,37 +804,37 @@ def setup(app): ####### This is an ignore list for broken links found in CI run checks for broken-linkcheck.yml linkcheck_ignore = [ - re.escape(r'http://'), - re.escape(r'http://scatterci.github.io/pydata/pandas'), - re.escape(r'http://specs.frictionlessdata.io/json-table-schema/'), - re.escape(r'https://'), - re.escape(r'https://cloud.google.com/bigquery/docs/access-control#roles'), - re.escape(r'https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query'), - re.escape(r'https://crates.io/crates/calamine'), - re.escape(r'https://devguide.python.org/setup/#macos'), - re.escape(r'https://en.wikipedia.org/wiki/Imputation_(statistics'), - re.escape(r'https://github.com/noatamir/pandas-dev'), - re.escape(r'https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1'), - re.escape(r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568'), - re.escape(r'https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495'), - re.escape(r'https://github.com/pandas-dev/pandas/issues/174151'), - re.escape(r'https://gitpod.io/#https://github.com/USERNAME/pandas'), - re.escape(r'https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/'), - re.escape(r'https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table'), - re.escape(r'https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html'), - re.escape(r'https://nbviewer.ipython.org/gist/metakermit/5720498'), - re.escape(r'https://numpy.org/doc/stable/user/basics.byteswapping.html'), - re.escape(r'https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0'), - re.escape(r'https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking'), - re.escape(r'https://pandas.pydata.org/pandas-docs/stable/ecosystem.html'), - re.escape(r'https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html'), - re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm'), - re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm'), - re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm'), - re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm'), - re.escape(r'https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm'), - re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm'), - re.escape(r'https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm'), - re.escape(r'https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/'), - re.escape(r'pandas.zip') + re.escape('http://'), + re.escape('http://scatterci.github.io/pydata/pandas'), + re.escape('http://specs.frictionlessdata.io/json-table-schema/'), + re.escape('https://'), + re.escape('https://cloud.google.com/bigquery/docs/access-control#roles'), + re.escape('https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query'), + re.escape('https://crates.io/crates/calamine'), + re.escape('https://devguide.python.org/setup/#macos'), + re.escape('https://en.wikipedia.org/wiki/Imputation_(statistics'), + re.escape('https://github.com/noatamir/pandas-dev'), + re.escape('https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1'), + re.escape('https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568'), + re.escape('https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495'), + re.escape('https://github.com/pandas-dev/pandas/issues/174151'), + re.escape('https://gitpod.io/#https://github.com/USERNAME/pandas'), + re.escape('https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/'), + re.escape('https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table'), + re.escape('https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html'), + re.escape('https://nbviewer.ipython.org/gist/metakermit/5720498'), + re.escape('https://numpy.org/doc/stable/user/basics.byteswapping.html'), + re.escape('https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0'), + re.escape('https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking'), + re.escape('https://pandas.pydata.org/pandas-docs/stable/ecosystem.html'), + re.escape('https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html'), + re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm'), + re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm'), + re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm'), + re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm'), + re.escape('https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm'), + re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm'), + re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm'), + re.escape('https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/'), + re.escape('pandas.zip') ] From 10d92596a8e614ecd413fad1b361e933c5e5251f Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Sat, 14 Oct 2023 00:08:00 +0530 Subject: [PATCH 31/49] Update conf.py --- doc/source/conf.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index f113cb9a7b158..81cd0caa91423 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -804,10 +804,8 @@ def setup(app): ####### This is an ignore list for broken links found in CI run checks for broken-linkcheck.yml linkcheck_ignore = [ - re.escape('http://'), re.escape('http://scatterci.github.io/pydata/pandas'), re.escape('http://specs.frictionlessdata.io/json-table-schema/'), - re.escape('https://'), re.escape('https://cloud.google.com/bigquery/docs/access-control#roles'), re.escape('https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query'), re.escape('https://crates.io/crates/calamine'), From eb3daab11bba7ff9b534f98b6daf1770692027f7 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Sat, 14 Oct 2023 00:14:44 +0530 Subject: [PATCH 32/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 067bcda7a2eb2..129f6f6d7c8d5 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -1,6 +1,6 @@ name: Linkcheck on: - workflow_dispatch: + workflow_dispatch: # Enable manual triggering schedule: # Run monthly on the 1st day of the month From e19e2d146ce3d1fdb00aa3d4f0138203ec677789 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Wed, 18 Oct 2023 12:36:21 +0530 Subject: [PATCH 33/49] Update doc/source/conf.py Co-authored-by: Philip Meier --- doc/source/conf.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/doc/source/conf.py b/doc/source/conf.py index 81cd0caa91423..5fcd4234dad35 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -804,6 +804,8 @@ def setup(app): ####### This is an ignore list for broken links found in CI run checks for broken-linkcheck.yml linkcheck_ignore = [ + '^http://$', + '^https://$', re.escape('http://scatterci.github.io/pydata/pandas'), re.escape('http://specs.frictionlessdata.io/json-table-schema/'), re.escape('https://cloud.google.com/bigquery/docs/access-control#roles'), From 7099cea2bfe4c44232a86b93334f621c12bb789b Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Wed, 18 Oct 2023 15:58:01 +0530 Subject: [PATCH 34/49] Update conf.py --- doc/source/conf.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 5fcd4234dad35..8794153d17ee2 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -801,7 +801,8 @@ def setup(app): app.add_directive("autosummary", PandasAutosummary) -####### This is an ignore list for broken links found in CI run checks for broken-linkcheck.yml +####### This is an ignore list for broken links, +####### found in CI run checks for broken-linkcheck.yml linkcheck_ignore = [ '^http://$', From 36beaed1d981e114235c7a5e71ab7520854ee1cb Mon Sep 17 00:00:00 2001 From: "pre-commit-ci[bot]" <66853113+pre-commit-ci[bot]@users.noreply.github.com> Date: Wed, 18 Oct 2023 12:10:03 +0000 Subject: [PATCH 35/49] [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci --- doc/source/conf.py | 96 ++++++++++++++++++++++++++++++---------------- 1 file changed, 62 insertions(+), 34 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 8794153d17ee2..f352c50aa1bbb 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -14,9 +14,9 @@ import inspect import logging import os +import re import sys import warnings -import re import jinja2 from numpydoc.docscrape import NumpyDocString @@ -805,37 +805,65 @@ def setup(app): ####### found in CI run checks for broken-linkcheck.yml linkcheck_ignore = [ - '^http://$', - '^https://$', - re.escape('http://scatterci.github.io/pydata/pandas'), - re.escape('http://specs.frictionlessdata.io/json-table-schema/'), - re.escape('https://cloud.google.com/bigquery/docs/access-control#roles'), - re.escape('https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query'), - re.escape('https://crates.io/crates/calamine'), - re.escape('https://devguide.python.org/setup/#macos'), - re.escape('https://en.wikipedia.org/wiki/Imputation_(statistics'), - re.escape('https://github.com/noatamir/pandas-dev'), - re.escape('https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1'), - re.escape('https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568'), - re.escape('https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495'), - re.escape('https://github.com/pandas-dev/pandas/issues/174151'), - re.escape('https://gitpod.io/#https://github.com/USERNAME/pandas'), - re.escape('https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/'), - re.escape('https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table'), - re.escape('https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html'), - re.escape('https://nbviewer.ipython.org/gist/metakermit/5720498'), - re.escape('https://numpy.org/doc/stable/user/basics.byteswapping.html'), - re.escape('https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0'), - re.escape('https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking'), - re.escape('https://pandas.pydata.org/pandas-docs/stable/ecosystem.html'), - re.escape('https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html'), - re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm'), - re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm'), - re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm'), - re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm'), - re.escape('https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm'), - re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm'), - re.escape('https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm'), - re.escape('https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/'), - re.escape('pandas.zip') + "^http://$", + "^https://$", + re.escape("http://scatterci.github.io/pydata/pandas"), + re.escape("http://specs.frictionlessdata.io/json-table-schema/"), + re.escape("https://cloud.google.com/bigquery/docs/access-control#roles"), + re.escape( + "https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query" + ), + re.escape("https://crates.io/crates/calamine"), + re.escape("https://devguide.python.org/setup/#macos"), + re.escape("https://en.wikipedia.org/wiki/Imputation_(statistics"), + re.escape("https://github.com/noatamir/pandas-dev"), + re.escape( + "https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1" + ), + re.escape( + "https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568" + ), + re.escape( + "https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495" + ), + re.escape("https://github.com/pandas-dev/pandas/issues/174151"), + re.escape("https://gitpod.io/#https://github.com/USERNAME/pandas"), + re.escape("https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/"), + re.escape("https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table"), + re.escape( + "https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html" + ), + re.escape("https://nbviewer.ipython.org/gist/metakermit/5720498"), + re.escape("https://numpy.org/doc/stable/user/basics.byteswapping.html"), + re.escape( + "https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0" + ), + re.escape("https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking"), + re.escape("https://pandas.pydata.org/pandas-docs/stable/ecosystem.html"), + re.escape("https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html"), + re.escape( + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm" + ), + re.escape( + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm" + ), + re.escape( + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm" + ), + re.escape( + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm" + ), + re.escape( + "https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm" + ), + re.escape( + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm" + ), + re.escape( + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm" + ), + re.escape( + "https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/" + ), + re.escape("pandas.zip"), ] From faab0e2c1fe2a0cae9a193667c7056d709041bc2 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 26 Oct 2023 00:34:15 +0530 Subject: [PATCH 36/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Matthew Roeschke <10647082+mroeschke@users.noreply.github.com> --- .github/workflows/broken-linkcheck.yml | 2 -- 1 file changed, 2 deletions(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 129f6f6d7c8d5..032f681ab822d 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -1,7 +1,5 @@ name: Linkcheck on: - workflow_dispatch: - # Enable manual triggering schedule: # Run monthly on the 1st day of the month - cron: '0 0 1 * *' From 2d355f385dfb959eb8e1ca04920e64a5d4811c1d Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 26 Oct 2023 00:34:37 +0530 Subject: [PATCH 37/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Matthew Roeschke <10647082+mroeschke@users.noreply.github.com> --- .github/workflows/broken-linkcheck.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 032f681ab822d..2c044b7fb59b4 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -12,7 +12,7 @@ jobs: runs-on: ubuntu-latest defaults: run: - shell: bash -el {0} + shell: bash -el {0} steps: - name: Checkout From d148d535af825e53ec2f8d9bda12b75248ac921d Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 26 Oct 2023 00:35:19 +0530 Subject: [PATCH 38/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Matthew Roeschke <10647082+mroeschke@users.noreply.github.com> --- .github/workflows/broken-linkcheck.yml | 1 - 1 file changed, 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 2c044b7fb59b4..a24b2b0551020 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -25,7 +25,6 @@ jobs: - name: Build Pandas uses: ./.github/actions/build_pandas - - name: Run linkcheck script working-directory: ./doc run: | From b6d3825ebfe2c0eefb871196d7e1675a78b601ba Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 26 Oct 2023 00:38:50 +0530 Subject: [PATCH 39/49] Update conf.py --- doc/source/conf.py | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 8cfea7fe849fe..175512440118e 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -801,8 +801,7 @@ def setup(app): app.add_directive("autosummary", PandasAutosummary) -####### This is an ignore list for broken links, -####### found in CI run checks for broken-linkcheck.yml +#Ignore list for broken links,found in CI run checks for broken-linkcheck.yml linkcheck_ignore = [ "^http://$", From 9190aec38b01471396bf142430c0bce27621d10e Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 26 Oct 2023 00:41:58 +0530 Subject: [PATCH 40/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Matthew Roeschke <10647082+mroeschke@users.noreply.github.com> --- .github/workflows/broken-linkcheck.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index a24b2b0551020..322ebc30d9086 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -18,7 +18,7 @@ jobs: - name: Checkout uses: actions/checkout@v4 with: - fetch-depth: 0 + fetch-depth: 0 - name: Set up Conda uses: ./.github/actions/setup-conda From 4f7f3056992c47f77522a98ef5cc2e21d5235a9d Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 26 Oct 2023 01:17:14 +0530 Subject: [PATCH 41/49] Update conf.py --- doc/source/conf.py | 94 +++++++++++++++++----------------------------- 1 file changed, 34 insertions(+), 60 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 175512440118e..89233bcf30f41 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -803,66 +803,40 @@ def setup(app): #Ignore list for broken links,found in CI run checks for broken-linkcheck.yml -linkcheck_ignore = [ +links = [ "^http://$", "^https://$", - re.escape("http://scatterci.github.io/pydata/pandas"), - re.escape("http://specs.frictionlessdata.io/json-table-schema/"), - re.escape("https://cloud.google.com/bigquery/docs/access-control#roles"), - re.escape( - "https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query" - ), - re.escape("https://crates.io/crates/calamine"), - re.escape("https://devguide.python.org/setup/#macos"), - re.escape("https://en.wikipedia.org/wiki/Imputation_(statistics"), - re.escape("https://github.com/noatamir/pandas-dev"), - re.escape( - "https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1" - ), - re.escape( - "https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568" - ), - re.escape( - "https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495" - ), - re.escape("https://github.com/pandas-dev/pandas/issues/174151"), - re.escape("https://gitpod.io/#https://github.com/USERNAME/pandas"), - re.escape("https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/"), - re.escape("https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table"), - re.escape( - "https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html" - ), - re.escape("https://nbviewer.ipython.org/gist/metakermit/5720498"), - re.escape("https://numpy.org/doc/stable/user/basics.byteswapping.html"), - re.escape( - "https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0" - ), - re.escape("https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking"), - re.escape("https://pandas.pydata.org/pandas-docs/stable/ecosystem.html"), - re.escape("https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html"), - re.escape( - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm" - ), - re.escape( - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm" - ), - re.escape( - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm" - ), - re.escape( - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm" - ), - re.escape( - "https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm" - ), - re.escape( - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm" - ), - re.escape( - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm" - ), - re.escape( - "https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/" - ), - re.escape("pandas.zip"), + "http://scatterci.github.io/pydata/pandas", + "http://specs.frictionlessdata.io/json-table-schema/", + "https://cloud.google.com/bigquery/docs/access-control#roles", + "https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query", + "https://crates.io/crates/calamine", + "https://devguide.python.org/setup/#macos", + "https://en.wikipedia.org/wiki/Imputation_statistics", + "https://github.com/noatamir/pandas-dev", + "https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1", + "https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568", + "https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495", + "https://github.com/pandas-dev/pandas/issues/174151", + "https://gitpod.io/#https://github.com/USERNAME/pandas", + "https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/", + "https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table", + "https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html", + "https://nbviewer.ipython.org/gist/metakermit/5720498", + "https://numpy.org/doc/stable/user/basics.byteswapping.html", + "https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0", + "https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking", + "https://pandas.pydata.org/pandas-docs/stable/ecosystem.html", + "https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm", + "https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm", + "https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/", + "pandas.zip", ] + +linkcheck_ignore = [re.escape(link) for link in links] From fb086eae8d4db4bfd7a69f42d17abc4a4bda13ad Mon Sep 17 00:00:00 2001 From: "pre-commit-ci[bot]" <66853113+pre-commit-ci[bot]@users.noreply.github.com> Date: Wed, 25 Oct 2023 19:57:51 +0000 Subject: [PATCH 42/49] [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci --- doc/source/conf.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 89233bcf30f41..fd7af99825f6d 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -801,7 +801,7 @@ def setup(app): app.add_directive("autosummary", PandasAutosummary) -#Ignore list for broken links,found in CI run checks for broken-linkcheck.yml +# Ignore list for broken links,found in CI run checks for broken-linkcheck.yml links = [ "^http://$", From a88d02cdfebe6deaba77494d624193e62170ba31 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 26 Oct 2023 19:23:59 +0530 Subject: [PATCH 43/49] Update conf.py --- doc/source/conf.py | 1 + 1 file changed, 1 insertion(+) diff --git a/doc/source/conf.py b/doc/source/conf.py index fd7af99825f6d..58a91acfe6dbb 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -813,6 +813,7 @@ def setup(app): "https://crates.io/crates/calamine", "https://devguide.python.org/setup/#macos", "https://en.wikipedia.org/wiki/Imputation_statistics", + "https://en.wikipedia.org/wiki/Imputation_(statistics", "https://github.com/noatamir/pandas-dev", "https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1", "https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568", From 8b62ee3ae2157424ef26aa1c50df8e7163581e29 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 26 Oct 2023 20:56:06 +0530 Subject: [PATCH 44/49] Update conf.py --- doc/source/conf.py | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 58a91acfe6dbb..1b9b68580510c 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -840,4 +840,11 @@ def setup(app): "pandas.zip", ] -linkcheck_ignore = [re.escape(link) for link in links] +# Exclude specific links from the links list + +excluded_links = ["^http://$", "^https://$"] +filtered_links = [link for link in links if link not in excluded_links] + +# Apply re.escape() to the filtered links + +linkcheck_ignore = [re.escape(link) for link in filtered_links] From 6231fd2b1adb9cf2074bb56ac4d19039df446878 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Thu, 26 Oct 2023 22:38:07 +0530 Subject: [PATCH 45/49] Update conf.py --- doc/source/conf.py | 79 ++++++++++++++++++++++------------------------ 1 file changed, 37 insertions(+), 42 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 1b9b68580510c..3f68dabffb4e6 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -803,48 +803,43 @@ def setup(app): # Ignore list for broken links,found in CI run checks for broken-linkcheck.yml -links = [ +linkcheck_ignore = [ "^http://$", "^https://$", - "http://scatterci.github.io/pydata/pandas", - "http://specs.frictionlessdata.io/json-table-schema/", - "https://cloud.google.com/bigquery/docs/access-control#roles", - "https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query", - "https://crates.io/crates/calamine", - "https://devguide.python.org/setup/#macos", - "https://en.wikipedia.org/wiki/Imputation_statistics", - "https://en.wikipedia.org/wiki/Imputation_(statistics", - "https://github.com/noatamir/pandas-dev", - "https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1", - "https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568", - "https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495", - "https://github.com/pandas-dev/pandas/issues/174151", - "https://gitpod.io/#https://github.com/USERNAME/pandas", - "https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/", - "https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table", - "https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html", - "https://nbviewer.ipython.org/gist/metakermit/5720498", - "https://numpy.org/doc/stable/user/basics.byteswapping.html", - "https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0", - "https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking", - "https://pandas.pydata.org/pandas-docs/stable/ecosystem.html", - "https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html", - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm", - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm", - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm", - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm", - "https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm", - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm", - "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm", - "https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/", - "pandas.zip", + *[ + re.escape(link) + for link in [ + "http://scatterci.github.io/pydata/pandas", + "http://specs.frictionlessdata.io/json-table-schema/", + "https://cloud.google.com/bigquery/docs/access-control#roles", + "https://cloud.google.com/bigquery/docs/reference/rest/v2/jobs#configuration.query", + "https://crates.io/crates/calamine", + "https://devguide.python.org/setup/#macos", + "https://en.wikipedia.org/wiki/Imputation_statistics", + "https://en.wikipedia.org/wiki/Imputation_(statistics", + "https://github.com/noatamir/pandas-dev", + "https://github.com/pandas-dev/pandas/blob/main/pandas/plotting/__init__.py#L1", + "https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/generic.py#L568", + "https://github.com/pandas-dev/pandas/blob/v0.20.2/pandas/core/frame.py#L1495", + "https://github.com/pandas-dev/pandas/issues/174151", + "https://gitpod.io/#https://github.com/USERNAME/pandas", + "https://manishamde.github.io/blog/2013/03/07/pandas-and-python-top-10/", + "https://matplotlib.org/api/axes_api.html#matplotlib.axes.Axes.table", + "https://nipunbatra.github.io/blog/visualisation/2013/05/01/aggregation-timeseries.html", + "https://nbviewer.ipython.org/gist/metakermit/5720498", + "https://numpy.org/doc/stable/user/basics.byteswapping.html", + "https://pandas-gbq.readthedocs.io/en/latest/changelog.html#changelog-0-8-0", + "https://pandas.pydata.org/pandas-docs/stable/io.html#io-chunking", + "https://pandas.pydata.org/pandas-docs/stable/ecosystem.html", + "https://sqlalchemy.readthedocs.io/en/latest/dialects/index.html", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245912.htm", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000214639.htm", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002283942.htm", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a000245965.htm", + "https://support.sas.com/documentation/cdl/en/imlug/66845/HTML/default/viewer.htm#imlug_langref_sect455.htm", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm", + "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm", + "https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/", + "pandas.zip",] + ] ] - -# Exclude specific links from the links list - -excluded_links = ["^http://$", "^https://$"] -filtered_links = [link for link in links if link not in excluded_links] - -# Apply re.escape() to the filtered links - -linkcheck_ignore = [re.escape(link) for link in filtered_links] From f4e9d1caade4e44fd0a5fc20ed8416083b61bb70 Mon Sep 17 00:00:00 2001 From: "pre-commit-ci[bot]" <66853113+pre-commit-ci[bot]@users.noreply.github.com> Date: Thu, 26 Oct 2023 17:17:35 +0000 Subject: [PATCH 46/49] [pre-commit.ci] auto fixes from pre-commit.com hooks for more information, see https://pre-commit.ci --- doc/source/conf.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 3f68dabffb4e6..7b86e9399bc85 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -840,6 +840,7 @@ def setup(app): "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm", "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm", "https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/", - "pandas.zip",] - ] + "pandas.zip", + ] + ], ] From 368b4bc02a35a1d48273cecdd39648d40ffe12b6 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Tue, 7 Nov 2023 23:46:45 +0530 Subject: [PATCH 47/49] Update .github/workflows/broken-linkcheck.yml Co-authored-by: Matthew Roeschke <10647082+mroeschke@users.noreply.github.com> --- .github/workflows/broken-linkcheck.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 322ebc30d9086..048a54e9d3e30 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -25,6 +25,7 @@ jobs: - name: Build Pandas uses: ./.github/actions/build_pandas + - name: Run linkcheck script working-directory: ./doc run: | From 0b22bea3449d8e13f9308c9e694ff44af503a73b Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Wed, 8 Nov 2023 00:02:34 +0530 Subject: [PATCH 48/49] Update broken-linkcheck.yml --- .github/workflows/broken-linkcheck.yml | 60 +++++++++++++------------- 1 file changed, 30 insertions(+), 30 deletions(-) diff --git a/.github/workflows/broken-linkcheck.yml b/.github/workflows/broken-linkcheck.yml index 048a54e9d3e30..10ab5b08a4437 100644 --- a/.github/workflows/broken-linkcheck.yml +++ b/.github/workflows/broken-linkcheck.yml @@ -1,38 +1,38 @@ name: Linkcheck on: - schedule: - # Run monthly on the 1st day of the month - - cron: '0 0 1 * *' - pull_request: - paths: - - ".github/workflows/broken-linkcheck.yml" - - "doc/make.py" + schedule: + # Run monthly on the 1st day of the month + - cron: '0 0 1 * *' + pull_request: + paths: + - ".github/workflows/broken-linkcheck.yml" + - "doc/make.py" jobs: - linkcheck: - runs-on: ubuntu-latest - defaults: - run: - shell: bash -el {0} + linkcheck: + runs-on: ubuntu-latest + defaults: + run: + shell: bash -el {0} - steps: - - name: Checkout - uses: actions/checkout@v4 - with: - fetch-depth: 0 + steps: + - name: Checkout + uses: actions/checkout@v4 + with: + fetch-depth: 0 - - name: Set up Conda - uses: ./.github/actions/setup-conda + - name: Set up Conda + uses: ./.github/actions/setup-conda - - name: Build Pandas - uses: ./.github/actions/build_pandas + - name: Build Pandas + uses: ./.github/actions/build_pandas - - name: Run linkcheck script - working-directory: ./doc - run: | - set -o pipefail - python make.py linkcheck | tee linkcheck.txt + - name: Run linkcheck script + working-directory: ./doc + run: | + set -o pipefail + python make.py linkcheck | tee linkcheck.txt - - name: Display broken links - if: failure() - working-directory: ./doc - run: grep broken linkcheck.txt + - name: Display broken links + if: failure() + working-directory: ./doc + run: grep broken linkcheck.txt From c36aa096063611ede664a51dcd4da27ef8856d33 Mon Sep 17 00:00:00 2001 From: AG <98327736+ggold7046@users.noreply.github.com> Date: Wed, 8 Nov 2023 01:22:27 +0530 Subject: [PATCH 49/49] Update conf.py --- doc/source/conf.py | 1 + 1 file changed, 1 insertion(+) diff --git a/doc/source/conf.py b/doc/source/conf.py index 7b86e9399bc85..6b52b52ce5e13 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -840,6 +840,7 @@ def setup(app): "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002284668.htm", "https://support.sas.com/documentation/cdl/en/lrdict/64316/HTML/default/viewer.htm#a002978282.htm", "https://wesmckinney.com/blog/update-on-upcoming-pandas-v0-10-new-file-parser-other-performance-wins/", + "https://visualstudio.microsoft.com/downloads/#build-tools-for-visual-studio-2022", "pandas.zip", ] ],