From de05a2724126d9f1ac9da4c2c62b7d67381f61a2 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 12:38:18 +0530 Subject: [PATCH 01/65] Create main.yml --- .github/workflows/main.yml | 18 ++++++++++++++++++ 1 file changed, 18 insertions(+) create mode 100644 .github/workflows/main.yml diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml new file mode 100644 index 0000000..1bde2bf --- /dev/null +++ b/.github/workflows/main.yml @@ -0,0 +1,18 @@ + - name: Setup Go environment + uses: actions/setup-go@v4.1.0 + with: + # The Go version to download (if necessary) and use. Supports semver spec and ranges. Be sure to enclose this option in single quotation marks. + go-version: # optional + # Path to the go.mod or go.work file. + go-version-file: # optional + # Set this option to true if you want the action to always check for the latest available version that satisfies the version spec + check-latest: # optional + # Used to pull Go distributions from go-versions. Since there's a default, this is typically not supplied by the user. When running this action on github.com, the default value is sufficient. When running on GHES, you can pass a personal access token for github.com if you are experiencing rate limiting. + token: # optional, default is ${{ github.server_url == 'https://github.com' && github.token || '' }} + # Used to specify whether caching is needed. Set to true, if you'd like to enable caching. + cache: # optional, default is true + # Used to specify the path to a dependency file - go.sum + cache-dependency-path: # optional + # Target architecture for Go to use. Examples: x86, x64. Will use system architecture by default. + architecture: # optional + From 0eacde968124173f19ac96bb92a8f5d9079b7a8f Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 13:45:20 +0530 Subject: [PATCH 02/65] Update main.yml --- .github/workflows/main.yml | 42 ++++++++++++++++++++++---------------- 1 file changed, 24 insertions(+), 18 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 1bde2bf..562089d 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -1,18 +1,24 @@ - - name: Setup Go environment - uses: actions/setup-go@v4.1.0 - with: - # The Go version to download (if necessary) and use. Supports semver spec and ranges. Be sure to enclose this option in single quotation marks. - go-version: # optional - # Path to the go.mod or go.work file. - go-version-file: # optional - # Set this option to true if you want the action to always check for the latest available version that satisfies the version spec - check-latest: # optional - # Used to pull Go distributions from go-versions. Since there's a default, this is typically not supplied by the user. When running this action on github.com, the default value is sufficient. When running on GHES, you can pass a personal access token for github.com if you are experiencing rate limiting. - token: # optional, default is ${{ github.server_url == 'https://github.com' && github.token || '' }} - # Used to specify whether caching is needed. Set to true, if you'd like to enable caching. - cache: # optional, default is true - # Used to specify the path to a dependency file - go.sum - cache-dependency-path: # optional - # Target architecture for Go to use. Examples: x86, x64. Will use system architecture by default. - architecture: # optional - +name: Your Workflow Name + +on: + schedule: + - cron: '*/20 * * * *' + +jobs: + setup-go: + runs-on: ubuntu-latest + + steps: + - name: Checkout Repository + uses: actions/checkout@v2 + + - name: Setup Go environment + uses: actions/setup-go@v4.1.0 + with: + go-version: # specify your Go version if needed + go-version-file: # specify your go version file if needed + check-latest: # specify if you want to check for the latest version + token: ${{ github.token }} + cache: true + cache-dependency-path: # specify your cache dependency path if needed + architecture: # specify your target architecture if needed From 45772841ce019107d4c79bb02f5199757148fb06 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 14:00:40 +0530 Subject: [PATCH 03/65] Update main.yml --- .github/workflows/main.yml | 24 +++++++++--------------- 1 file changed, 9 insertions(+), 15 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 562089d..e3fac57 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -1,24 +1,18 @@ -name: Your Workflow Name +name: Scheduled Workflow on: schedule: - - cron: '*/20 * * * *' + - cron: '0 * * * *' # Run every hour jobs: - setup-go: + run-code: runs-on: ubuntu-latest steps: - - name: Checkout Repository - uses: actions/checkout@v2 + - name: Checkout repository + uses: actions/checkout@v2 + + - name: Run code + run: | + rbiparser download -d "./xls" - - name: Setup Go environment - uses: actions/setup-go@v4.1.0 - with: - go-version: # specify your Go version if needed - go-version-file: # specify your go version file if needed - check-latest: # specify if you want to check for the latest version - token: ${{ github.token }} - cache: true - cache-dependency-path: # specify your cache dependency path if needed - architecture: # specify your target architecture if needed From 6c0a5876bc87ec694b86644a1bacdb4ba4d0f350 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 14:09:48 +0530 Subject: [PATCH 04/65] Update main.yml --- .github/workflows/main.yml | 11 +++++++++-- 1 file changed, 9 insertions(+), 2 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index e3fac57..0779b99 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -12,7 +12,14 @@ jobs: - name: Checkout repository uses: actions/checkout@v2 - - name: Run code + - name: Run code and save output run: | - rbiparser download -d "./xls" + rbiparser download -d "./xls" > output.txt + + + - name: Upload artifact + uses: actions/upload-artifact@v2 + with: + name: my-script-output + path: output.txt From e4dfba409b144090b0daaf2d25b6f0d3feb10009 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 14:50:33 +0530 Subject: [PATCH 05/65] Update main.yml --- .github/workflows/main.yml | 13 +++---------- 1 file changed, 3 insertions(+), 10 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 0779b99..1a7bb43 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -2,7 +2,7 @@ name: Scheduled Workflow on: schedule: - - cron: '0 * * * *' # Run every hour + - cron: '*/4 * * * *' # Run every 4 minutes jobs: run-code: @@ -12,14 +12,7 @@ jobs: - name: Checkout repository uses: actions/checkout@v2 - - name: Run code and save output + - name: Run code run: | - rbiparser download -d "./xls" > output.txt + rbiparser download -d "./xls" - - - - name: Upload artifact - uses: actions/upload-artifact@v2 - with: - name: my-script-output - path: output.txt From 19b382682b07fce2dee85b489d37875544b2d7a4 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 14:50:55 +0530 Subject: [PATCH 06/65] Update main.yml --- .github/workflows/main.yml | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 1a7bb43..8763936 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -14,5 +14,4 @@ jobs: - name: Run code run: | - rbiparser download -d "./xls" - + rbiparser download -d "./xls" From 142fb632754822c0681abac71d5f4f01d6ad3a6f Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:04:41 +0530 Subject: [PATCH 07/65] Update main.yml s --- .github/workflows/main.yml | 24 ++++++++++++++++-------- 1 file changed, 16 insertions(+), 8 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 8763936..10e20f2 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -1,17 +1,25 @@ -name: Scheduled Workflow +name: run main.py on: schedule: - - cron: '*/4 * * * *' # Run every 4 minutes + - cron: '*/10 * * * *' # At every 10th minute of every hour jobs: - run-code: + build: runs-on: ubuntu-latest - steps: - - name: Checkout repository - uses: actions/checkout@v2 + - name: checkout repo content + uses: actions/checkout@v2 # checkout the repository content + + - name: setup python + uses: actions/setup-python@v4 + with: + python-version: '3.10' # install the python version needed - - name: Run code + - name: install python packages run: | - rbiparser download -d "./xls" + python -m pip install --upgrade pip + pip install -r requirements.txt + + - name: execute py script # run main.py + run: python main.py From e498791eaaccc9f14549f5cea1e66f6a0f752345 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:10:38 +0530 Subject: [PATCH 08/65] Create python-app.yml ok --- .github/workflows/python-app.yml | 26 ++++++++++++++++++++++++++ 1 file changed, 26 insertions(+) create mode 100644 .github/workflows/python-app.yml diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml new file mode 100644 index 0000000..015f11c --- /dev/null +++ b/.github/workflows/python-app.yml @@ -0,0 +1,26 @@ +name: run main.py every 10 minutes + +on: + schedule: + - cron: '*/10 * * * *' # At every 10th minute of every hour + +jobs: + build: + runs-on: ubuntu-latest + steps: + - name: checkout repo content + uses: actions/checkout@v2 # checkout the repository content + + - name: setup python + uses: actions/setup-python@v4 + with: + python-version: '2.7' # install the python version needed + + - name: install python packages + run: | + python -m pip install --upgrade pip + pip install -r requirements.txt + + + - name: execute py script # run main.py + run: rbiparser download -d "./xls" From 84a924d034d86d0eb506226779995180f9b5ec79 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:12:16 +0530 Subject: [PATCH 09/65] Update main.yml --- .github/workflows/main.yml | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 10e20f2..015f11c 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -1,4 +1,4 @@ -name: run main.py +name: run main.py every 10 minutes on: schedule: @@ -14,12 +14,13 @@ jobs: - name: setup python uses: actions/setup-python@v4 with: - python-version: '3.10' # install the python version needed + python-version: '2.7' # install the python version needed - name: install python packages run: | python -m pip install --upgrade pip pip install -r requirements.txt + - name: execute py script # run main.py - run: python main.py + run: rbiparser download -d "./xls" From 02be71ead33a568b35de7771bb9f495aa0808c7d Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:16:49 +0530 Subject: [PATCH 10/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 015f11c..ef71605 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -19,7 +19,7 @@ jobs: - name: install python packages run: | python -m pip install --upgrade pip - pip install -r requirements.txt + pip install rbiparser - name: execute py script # run main.py From 70c5b0bd33215718ff719f5d7024e9075ce218bf Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:23:51 +0530 Subject: [PATCH 11/65] Update main.yml --- .github/workflows/main.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index ef71605..9b1cc75 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -2,7 +2,7 @@ name: run main.py every 10 minutes on: schedule: - - cron: '*/10 * * * *' # At every 10th minute of every hour + - cron: '*/2 * * * *' # At every 10th minute of every hour jobs: build: @@ -14,7 +14,7 @@ jobs: - name: setup python uses: actions/setup-python@v4 with: - python-version: '2.7' # install the python version needed + python-version: '3.10' # install the python version needed - name: install python packages run: | From b7ed95e78cf708d60b5ad9a1d270f143fe589129 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:28:21 +0530 Subject: [PATCH 12/65] Update python-app.yml --- .github/workflows/python-app.yml | 25 ------------------------- 1 file changed, 25 deletions(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index 015f11c..8b13789 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -1,26 +1 @@ -name: run main.py every 10 minutes -on: - schedule: - - cron: '*/10 * * * *' # At every 10th minute of every hour - -jobs: - build: - runs-on: ubuntu-latest - steps: - - name: checkout repo content - uses: actions/checkout@v2 # checkout the repository content - - - name: setup python - uses: actions/setup-python@v4 - with: - python-version: '2.7' # install the python version needed - - - name: install python packages - run: | - python -m pip install --upgrade pip - pip install -r requirements.txt - - - - name: execute py script # run main.py - run: rbiparser download -d "./xls" From 0455f20e0a57a7650c157f3eade50efd86fd4b81 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:31:21 +0530 Subject: [PATCH 13/65] Update main.yml --- .github/workflows/main.yml | 15 +++++++-------- 1 file changed, 7 insertions(+), 8 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 9b1cc75..7422384 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -1,26 +1,25 @@ -name: run main.py every 10 minutes +name: Run main.py every 2 minutes on: schedule: - - cron: '*/2 * * * *' # At every 10th minute of every hour + - cron: '*/2 * * * *' # At every 2nd minute of every hour jobs: build: runs-on: ubuntu-latest steps: - - name: checkout repo content + - name: Checkout repo content uses: actions/checkout@v2 # checkout the repository content - - name: setup python + - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '3.10' # install the python version needed + python-version: '3.10' # install the Python version needed - - name: install python packages + - name: Install Python packages run: | python -m pip install --upgrade pip pip install rbiparser - - - name: execute py script # run main.py + - name: Execute Python script run: rbiparser download -d "./xls" From cf8e571138e09ebb6bb3d8d02ff63dd73054769a Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:38:49 +0530 Subject: [PATCH 14/65] Update python-app.yml --- .github/workflows/python-app.yml | 25 +++++++++++++++++++++++++ 1 file changed, 25 insertions(+) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index 8b13789..e8e2d5a 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -1 +1,26 @@ +name: Run main.py every 2 minutes + +on: + schedule: + - cron: '*/2 * * * *' # At every 2nd minute of every hour + +jobs: + build: + runs-on: ubuntu-latest + steps: + - name: Checkout repo content + uses: actions/checkout@v2 # checkout the repository content + + - name: Setup Python + uses: actions/setup-python@v4 + with: + python-version: '3.10' # install the Python version needed + + - name: Install Python packages + run: | + python -m pip install --upgrade pip + pip install rbiparser + + - name: Execute Python script + run: rbiparser download -d "./xls" From 6c380544e06baf7db5fd41bb888655484a42792a Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:51:55 +0530 Subject: [PATCH 15/65] Update main.yml --- .github/workflows/main.yml | 11 ++++++++--- 1 file changed, 8 insertions(+), 3 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 7422384..a28e706 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -9,12 +9,12 @@ jobs: runs-on: ubuntu-latest steps: - name: Checkout repo content - uses: actions/checkout@v2 # checkout the repository content + uses: actions/checkout@v2 - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '3.10' # install the Python version needed + python-version: '3.10' - name: Install Python packages run: | @@ -22,4 +22,9 @@ jobs: pip install rbiparser - name: Execute Python script - run: rbiparser download -d "./xls" + run: | + echo "Checking current directory contents:" + ls -al + + echo "Running rbiparser download -d './xls':" + rbiparser download -d "./xls" From 46874a0f73438d4b462d876546e22c66374eb5ea Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:52:17 +0530 Subject: [PATCH 16/65] Update python-app.yml --- .github/workflows/python-app.yml | 12 ++++++++---- 1 file changed, 8 insertions(+), 4 deletions(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index e8e2d5a..a28e706 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -1,4 +1,3 @@ - name: Run main.py every 2 minutes on: @@ -10,12 +9,12 @@ jobs: runs-on: ubuntu-latest steps: - name: Checkout repo content - uses: actions/checkout@v2 # checkout the repository content + uses: actions/checkout@v2 - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '3.10' # install the Python version needed + python-version: '3.10' - name: Install Python packages run: | @@ -23,4 +22,9 @@ jobs: pip install rbiparser - name: Execute Python script - run: rbiparser download -d "./xls" + run: | + echo "Checking current directory contents:" + ls -al + + echo "Running rbiparser download -d './xls':" + rbiparser download -d "./xls" From 546002e3d9edf068de5bab12084e0ab919843927 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:56:12 +0530 Subject: [PATCH 17/65] Update main.yml From 0eff210e895a74dea534d2f31d0561df8354f949 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 15:56:35 +0530 Subject: [PATCH 18/65] Update python-app.yml From b166559c8084790cf81cef8500a3689914b0c76e Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:03:28 +0530 Subject: [PATCH 19/65] Create requirement.txt --- requirement.txt | 6 ++++++ 1 file changed, 6 insertions(+) create mode 100644 requirement.txt diff --git a/requirement.txt b/requirement.txt new file mode 100644 index 0000000..37b3f7a --- /dev/null +++ b/requirement.txt @@ -0,0 +1,6 @@ +rbiparser +requests +xlrd +beautifulsoup4 +click +lxml From 59be47d483d7e8cb84ee71e993ec8a50c856b68a Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:04:13 +0530 Subject: [PATCH 20/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index a28e706..da8e077 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -19,7 +19,7 @@ jobs: - name: Install Python packages run: | python -m pip install --upgrade pip - pip install rbiparser + pip install -r requirements.txt - name: Execute Python script run: | From 25fdc437663aa4cbd034cd26608dc82e0b408136 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:05:54 +0530 Subject: [PATCH 21/65] Update main.yml d --- .github/workflows/main.yml | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index da8e077..e7ed84c 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -21,10 +21,9 @@ jobs: python -m pip install --upgrade pip pip install -r requirements.txt - - name: Execute Python script + - name: remove rbiparser.egg-info run: | - echo "Checking current directory contents:" - ls -al + rm -rf rbiparser.egg-info - echo "Running rbiparser download -d './xls':" - rbiparser download -d "./xls" + - name: execute rbiparser + run: rbiparser download -d "./xls" From e39860ee558638c0520dff399fb9be4fc95809d8 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:07:43 +0530 Subject: [PATCH 22/65] Update python-app.yml --- .github/workflows/python-app.yml | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index a28e706..5b13bb3 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -21,10 +21,9 @@ jobs: python -m pip install --upgrade pip pip install rbiparser - - name: Execute Python script + - name: remove rbiparser.egg-info run: | - echo "Checking current directory contents:" - ls -al + rm -rf rbiparser.egg-info - echo "Running rbiparser download -d './xls':" - rbiparser download -d "./xls" + - name: execute rbiparser + run: rbiparser download -d "./xls" From cbeb04bcfec28195ae7a748962ef20c813696f51 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:15:39 +0530 Subject: [PATCH 23/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index e7ed84c..c9345f3 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -19,7 +19,7 @@ jobs: - name: Install Python packages run: | python -m pip install --upgrade pip - pip install -r requirements.txt + pip install -r requirement.txt - name: remove rbiparser.egg-info run: | From c9707dafde7f22275b6ec1fb62eff222fdab1c3f Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:26:46 +0530 Subject: [PATCH 24/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index c9345f3..f2c46b3 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -26,4 +26,4 @@ jobs: rm -rf rbiparser.egg-info - name: execute rbiparser - run: rbiparser download -d "./xls" + run: rbiparser combine --help From 5f3d4b6344a6d6d6bf957e5566c80dd6cf16516a Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:32:45 +0530 Subject: [PATCH 25/65] Update python-app.yml --- .github/workflows/python-app.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index 5b13bb3..cdd7c76 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -26,4 +26,4 @@ jobs: rm -rf rbiparser.egg-info - name: execute rbiparser - run: rbiparser download -d "./xls" + run: rbiparser combine --help From 71abaadb164dcaab32f994ec6d41266d324cdaa9 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:33:21 +0530 Subject: [PATCH 26/65] Update main.yml From fe26283bbe3f3ec8a479dda250dae1c12e64c90e Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:39:44 +0530 Subject: [PATCH 27/65] Update main.yml --- .github/workflows/main.yml | 16 +++++++++++----- 1 file changed, 11 insertions(+), 5 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index f2c46b3..00902d7 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -11,6 +11,11 @@ jobs: - name: Checkout repo content uses: actions/checkout@v2 + - name: Install Dependencies + run: | + sudo apt-get update + sudo apt-get install -y # Replace with the actual package name + - name: Setup Python uses: actions/setup-python@v4 with: @@ -19,11 +24,12 @@ jobs: - name: Install Python packages run: | python -m pip install --upgrade pip - pip install -r requirement.txt + pip install rbiparser - - name: remove rbiparser.egg-info + - name: Execute Python script run: | - rm -rf rbiparser.egg-info + echo "Checking current directory contents:" + ls -al - - name: execute rbiparser - run: rbiparser combine --help + echo "Running rbiparser download -d './xls':" + rbiparser download -d "./xls" From cfefa56f347774bd2fd95dcc312126b714f2779b Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:42:03 +0530 Subject: [PATCH 28/65] Update main.yml --- .github/workflows/main.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 00902d7..f2c224d 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -33,3 +33,4 @@ jobs: echo "Running rbiparser download -d './xls':" rbiparser download -d "./xls" + From 22dc5bf2915f140f3404c3545d60db2cefaf18f3 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:42:24 +0530 Subject: [PATCH 29/65] Update python-app.yml --- .github/workflows/python-app.yml | 14 ++++++++++---- 1 file changed, 10 insertions(+), 4 deletions(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index cdd7c76..00902d7 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -11,6 +11,11 @@ jobs: - name: Checkout repo content uses: actions/checkout@v2 + - name: Install Dependencies + run: | + sudo apt-get update + sudo apt-get install -y # Replace with the actual package name + - name: Setup Python uses: actions/setup-python@v4 with: @@ -21,9 +26,10 @@ jobs: python -m pip install --upgrade pip pip install rbiparser - - name: remove rbiparser.egg-info + - name: Execute Python script run: | - rm -rf rbiparser.egg-info + echo "Checking current directory contents:" + ls -al - - name: execute rbiparser - run: rbiparser combine --help + echo "Running rbiparser download -d './xls':" + rbiparser download -d "./xls" From 7cbf28e169bae22056ad88131542c484d7352906 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:52:25 +0530 Subject: [PATCH 30/65] Update main.yml --- .github/workflows/main.yml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index f2c224d..94b81f7 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -13,8 +13,9 @@ jobs: - name: Install Dependencies run: | - sudo apt-get update - sudo apt-get install -y # Replace with the actual package name + sudo apt-get update + sudo apt-get install -y + - name: Setup Python uses: actions/setup-python@v4 From aba7491e49abb42b719818ae9020297b65d461ce Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 16:52:41 +0530 Subject: [PATCH 31/65] Update python-app.yml --- .github/workflows/python-app.yml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index 00902d7..d2dece1 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -13,8 +13,9 @@ jobs: - name: Install Dependencies run: | - sudo apt-get update - sudo apt-get install -y # Replace with the actual package name + sudo apt-get update + sudo apt-get install -y + - name: Setup Python uses: actions/setup-python@v4 From 9fe12413b67d3f3114bb3453e3b50f413eda260c Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 17:15:58 +0530 Subject: [PATCH 32/65] Update main.yml --- .github/workflows/main.yml | 10 ++++------ 1 file changed, 4 insertions(+), 6 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 94b81f7..1f6dd15 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -11,14 +11,13 @@ jobs: - name: Checkout repo content uses: actions/checkout@v2 - - name: Install Dependencies + - name: Update package lists and install dependencies run: | - sudo apt-get update - sudo apt-get install -y - + sudo apt-get update + sudo apt-get install -y # Replace with the actual package name - name: Setup Python - uses: actions/setup-python@v4 + uses: actions/setup-python@v2 with: python-version: '3.10' @@ -34,4 +33,3 @@ jobs: echo "Running rbiparser download -d './xls':" rbiparser download -d "./xls" - From 5ee79bdaf77a8cf3c9dd5c3c2401c87b10d421ac Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 17:16:11 +0530 Subject: [PATCH 33/65] Update python-app.yml --- .github/workflows/python-app.yml | 9 ++++----- 1 file changed, 4 insertions(+), 5 deletions(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index d2dece1..1f6dd15 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -11,14 +11,13 @@ jobs: - name: Checkout repo content uses: actions/checkout@v2 - - name: Install Dependencies + - name: Update package lists and install dependencies run: | - sudo apt-get update - sudo apt-get install -y - + sudo apt-get update + sudo apt-get install -y # Replace with the actual package name - name: Setup Python - uses: actions/setup-python@v4 + uses: actions/setup-python@v2 with: python-version: '3.10' From 1de3f792f640758a50b94e337dc20c1272522d9f Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 17:25:11 +0530 Subject: [PATCH 34/65] Update main.yml --- .github/workflows/main.yml | 7 +------ 1 file changed, 1 insertion(+), 6 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 1f6dd15..a28e706 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -11,13 +11,8 @@ jobs: - name: Checkout repo content uses: actions/checkout@v2 - - name: Update package lists and install dependencies - run: | - sudo apt-get update - sudo apt-get install -y # Replace with the actual package name - - name: Setup Python - uses: actions/setup-python@v2 + uses: actions/setup-python@v4 with: python-version: '3.10' From d7b915feaa378c31db6e3247ddd342d23f97b99e Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 17:25:25 +0530 Subject: [PATCH 35/65] Update python-app.yml --- .github/workflows/python-app.yml | 7 +------ 1 file changed, 1 insertion(+), 6 deletions(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index 1f6dd15..a28e706 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -11,13 +11,8 @@ jobs: - name: Checkout repo content uses: actions/checkout@v2 - - name: Update package lists and install dependencies - run: | - sudo apt-get update - sudo apt-get install -y # Replace with the actual package name - - name: Setup Python - uses: actions/setup-python@v2 + uses: actions/setup-python@v4 with: python-version: '3.10' From 397bac62a1810d47df67f3ce33120dfdc99d748b Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 17:31:23 +0530 Subject: [PATCH 36/65] Update main.yml --- .github/workflows/main.yml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index a28e706..d81af54 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -26,5 +26,6 @@ jobs: echo "Checking current directory contents:" ls -al - echo "Running rbiparser download -d './xls':" - rbiparser download -d "./xls" + echo "Running rbiparser combine --help:" + rbiparser combine --help + From d8e912d233e9bd281bb1842fd986c71f320ffde4 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 17:31:49 +0530 Subject: [PATCH 37/65] Update python-app.yml --- .github/workflows/python-app.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index a28e706..06503dc 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -26,5 +26,5 @@ jobs: echo "Checking current directory contents:" ls -al - echo "Running rbiparser download -d './xls':" - rbiparser download -d "./xls" + echo "Running rbiparser combine --help:" + rbiparser combine --help From 36f5a11898dd7c38352a0725379df66555a9818c Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 17:39:11 +0530 Subject: [PATCH 38/65] Update __init__.py --- rbiparser/__init__.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/rbiparser/__init__.py b/rbiparser/__init__.py index 2199b65..74234b6 100644 --- a/rbiparser/__init__.py +++ b/rbiparser/__init__.py @@ -77,7 +77,7 @@ def get_sheet_urls(url): # Extract the urls. s = soup(r.content, "lxml") - links = s.findAll("a", href=re.compile("\.xlsx$")) + links = s.find_all("a", href=re.compile(".\.xls.")) if len(links) < 1: raise Exception("Couldn't find any .xlsx urls") From 1724cb7d400f1404d8302266e8525df641b2049d Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 17:40:07 +0530 Subject: [PATCH 39/65] Update main.yml --- .github/workflows/main.yml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index d81af54..74ffd3b 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -26,6 +26,7 @@ jobs: echo "Checking current directory contents:" ls -al - echo "Running rbiparser combine --help:" - rbiparser combine --help + echo "Running rbiparser download -d "./xls":" + rbiparser download -d "./xls" + From 78debb6860110b9340c14b15486f0eab0836f677 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 17:40:29 +0530 Subject: [PATCH 40/65] Update python-app.yml --- .github/workflows/python-app.yml | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index 06503dc..bc10ff5 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -26,5 +26,6 @@ jobs: echo "Checking current directory contents:" ls -al - echo "Running rbiparser combine --help:" - rbiparser combine --help + echo "Running rbiparser download -d "./xls":" + rbiparser download -d "./xls" + From 1e518279d4ab001535641f389cb21b2bdd010835 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 17:53:13 +0530 Subject: [PATCH 41/65] Update __init__.py From 06c79a2c53a4e8c9c0d36347d63d5b2364ac811c Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 18:25:59 +0530 Subject: [PATCH 42/65] Update python-app.yml --- .github/workflows/python-app.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index bc10ff5..e697f35 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -19,7 +19,8 @@ jobs: - name: Install Python packages run: | python -m pip install --upgrade pip - pip install rbiparser + python -m pip install --upgrade rbiparser + - name: Execute Python script run: | From 4a7a5d353d796507ae4aa24b7df3b013ab212a86 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 18:26:24 +0530 Subject: [PATCH 43/65] Update main.yml --- .github/workflows/main.yml | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 74ffd3b..f44508f 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -19,7 +19,8 @@ jobs: - name: Install Python packages run: | python -m pip install --upgrade pip - pip install rbiparser + python -m pip install --upgrade rbiparser + - name: Execute Python script run: | From 5c58415aab06d6ed06be95209241d5e558830ffe Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 18:57:24 +0530 Subject: [PATCH 44/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index f44508f..8d8b9c2 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -14,7 +14,7 @@ jobs: - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '3.10' + python-version: '3.11.2' - name: Install Python packages run: | From 4400f37315909ef2dbbc0b5279e069b7aead415e Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 20:01:06 +0530 Subject: [PATCH 45/65] Update __init__.py --- rbiparser/__init__.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/rbiparser/__init__.py b/rbiparser/__init__.py index 74234b6..b172514 100644 --- a/rbiparser/__init__.py +++ b/rbiparser/__init__.py @@ -77,7 +77,7 @@ def get_sheet_urls(url): # Extract the urls. s = soup(r.content, "lxml") - links = s.find_all("a", href=re.compile(".\.xls.")) + links = s.findall("a", href=re.compile(".\.xls.")) if len(links) < 1: raise Exception("Couldn't find any .xlsx urls") From 993acb7b86f0e9ae75130b3c94d9913911909230 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Wed, 29 Nov 2023 21:05:41 +0530 Subject: [PATCH 46/65] Update main.yml --- .github/workflows/main.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 8d8b9c2..7b8fa49 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -26,6 +26,7 @@ jobs: run: | echo "Checking current directory contents:" ls -al + pwd echo "Running rbiparser download -d "./xls":" rbiparser download -d "./xls" From 6971bc4e0fcc54bb832ef9ec039e2fe8dae97d85 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 09:40:26 +0530 Subject: [PATCH 47/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 7b8fa49..0c5d7ff 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -14,7 +14,7 @@ jobs: - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '3.11.2' + python-version: '3.11.0' - name: Install Python packages run: | From 47ddddf23bd54ea8a79cdd4f5de9c3d365d8f756 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 09:40:41 +0530 Subject: [PATCH 48/65] Update python-app.yml --- .github/workflows/python-app.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index e697f35..c773c9a 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -14,7 +14,7 @@ jobs: - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '3.10' + python-version: '3.11.0' - name: Install Python packages run: | From 10fa58dd34d604ee154fc49854ae27314d2f16f5 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 10:03:49 +0530 Subject: [PATCH 49/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 0c5d7ff..a895d08 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -2,7 +2,7 @@ name: Run main.py every 2 minutes on: schedule: - - cron: '*/2 * * * *' # At every 2nd minute of every hour + - cron: '*/10 * * * *' # At every 2nd minute of every hour jobs: build: From ed57097670c7c425477156d265f3e2c4e5f8d9c0 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 10:04:04 +0530 Subject: [PATCH 50/65] Update python-app.yml --- .github/workflows/python-app.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index c773c9a..b88d931 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -2,7 +2,7 @@ name: Run main.py every 2 minutes on: schedule: - - cron: '*/2 * * * *' # At every 2nd minute of every hour + - cron: '*/10 * * * *' # At every 2nd minute of every hour jobs: build: From d3203cdca1f92ff5607466af476a158838e0bf5c Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 10:06:58 +0530 Subject: [PATCH 51/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index a895d08..d3e5f1d 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -14,7 +14,7 @@ jobs: - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '3.11.0' + python-version: '3.10.13' - name: Install Python packages run: | From a03cf53ca26b01e59d8f497c8056310366fadcc0 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 10:07:08 +0530 Subject: [PATCH 52/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index d3e5f1d..6d9b1dd 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -2,7 +2,7 @@ name: Run main.py every 2 minutes on: schedule: - - cron: '*/10 * * * *' # At every 2nd minute of every hour + - cron: '*/4 * * * *' # At every 2nd minute of every hour jobs: build: From a7e43de54584578ac2c3b90eaed9bad4aef1b780 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 10:07:32 +0530 Subject: [PATCH 53/65] Update python-app.yml --- .github/workflows/python-app.yml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index b88d931..e36c221 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -2,7 +2,7 @@ name: Run main.py every 2 minutes on: schedule: - - cron: '*/10 * * * *' # At every 2nd minute of every hour + - cron: '*/4 * * * *' # At every 2nd minute of every hour jobs: build: @@ -14,7 +14,7 @@ jobs: - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '3.11.0' + python-version: '3.10.13' - name: Install Python packages run: | From a1a8436caa1eeffb4b3464d4091e60725cf1c88e Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 10:09:11 +0530 Subject: [PATCH 54/65] Update __init__.py --- rbiparser/__init__.py | 1 + 1 file changed, 1 insertion(+) diff --git a/rbiparser/__init__.py b/rbiparser/__init__.py index b172514..c2cd4fe 100644 --- a/rbiparser/__init__.py +++ b/rbiparser/__init__.py @@ -79,6 +79,7 @@ def get_sheet_urls(url): s = soup(r.content, "lxml") links = s.findall("a", href=re.compile(".\.xls.")) + if len(links) < 1: raise Exception("Couldn't find any .xlsx urls") From 74363866fb3fcdd520b04d9af46c4b14f5c800f8 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 10:57:41 +0530 Subject: [PATCH 55/65] Update __init__.py --- rbiparser/__init__.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/rbiparser/__init__.py b/rbiparser/__init__.py index c2cd4fe..b2615b3 100644 --- a/rbiparser/__init__.py +++ b/rbiparser/__init__.py @@ -77,7 +77,8 @@ def get_sheet_urls(url): # Extract the urls. s = soup(r.content, "lxml") - links = s.findall("a", href=re.compile(".\.xls.")) + links = s.find_all("a", attrs={"href": re.compile(r'\.xls')}) + if len(links) < 1: From c29cf5608691e692921cd4654fdbdd16b0b641ae Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 11:03:07 +0530 Subject: [PATCH 56/65] Update __init__.py --- rbiparser/__init__.py | 28 ++++++++++++++++++---------- 1 file changed, 18 insertions(+), 10 deletions(-) diff --git a/rbiparser/__init__.py b/rbiparser/__init__.py index b2615b3..0c8f391 100644 --- a/rbiparser/__init__.py +++ b/rbiparser/__init__.py @@ -69,22 +69,30 @@ exclude_words = ["to", "the", "at", "of", "by", "as", "for", "via"] +# ... (previous code) + def get_sheet_urls(url): - """Scrapes the RBI page and gets the list of .xlsx sheets.""" - r = requests.get(url) - if r.status_code != 200: - raise Exception("Invalid response from", url) + """Scrapes the RBI page and gets the list of .xlsx sheets.""" + r = requests.get(url) + if r.status_code != 200: + raise Exception("Invalid response from", url) + + # Extract the HTML content for debugging. + html_content = r.content + print("HTML Content:") + print(html_content) - # Extract the urls. - s = soup(r.content, "lxml") - links = s.find_all("a", attrs={"href": re.compile(r'\.xls')}) + # Extract the urls. + s = soup(html_content, "lxml") + links = s.find_all("a", attrs={"href": re.compile(r'\.xls')}) + if len(links) < 1: + raise Exception("Couldn't find any .xls urls") + return [l["href"] for l in links] - if len(links) < 1: - raise Exception("Couldn't find any .xlsx urls") +# ... (rest of the code) - return [l["href"] for l in links] def convert_xlsx_to_csv(src, target, headers): From 896e71f4639b0083cca8e184374e5d6b7e9be83f Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 11:05:40 +0530 Subject: [PATCH 57/65] Update __init__.py --- rbiparser/__init__.py | 14 ++++++-------- 1 file changed, 6 insertions(+), 8 deletions(-) diff --git a/rbiparser/__init__.py b/rbiparser/__init__.py index 0c8f391..5fbf284 100644 --- a/rbiparser/__init__.py +++ b/rbiparser/__init__.py @@ -68,9 +68,6 @@ exclude_words = ["to", "the", "at", "of", "by", "as", "for", "via"] - -# ... (previous code) - def get_sheet_urls(url): """Scrapes the RBI page and gets the list of .xlsx sheets.""" r = requests.get(url) @@ -84,14 +81,15 @@ def get_sheet_urls(url): # Extract the urls. s = soup(html_content, "lxml") - links = s.find_all("a", attrs={"href": re.compile(r'\.xls')}) + links = [a["href"] for a in s.find_all("a", href=True)] - if len(links) < 1: - raise Exception("Couldn't find any .xls urls") + # Filter links with ".xls" in the href. + xls_links = [link for link in links if ".xls" in link] - return [l["href"] for l in links] + if len(xls_links) < 1: + raise Exception("Couldn't find any .xls urls") -# ... (rest of the code) + return xls_links From a51f48e0b9bfc2c08437e9dd2eff2e5f6edc8b60 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 11:33:17 +0530 Subject: [PATCH 58/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index 6d9b1dd..e4981aa 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -14,7 +14,7 @@ jobs: - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '3.10.13' + python-version: '3.11.0' - name: Install Python packages run: | From 5050b7ca623c414bdc43200b466c5085ef090c27 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 11:33:34 +0530 Subject: [PATCH 59/65] Update python-app.yml --- .github/workflows/python-app.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/python-app.yml b/.github/workflows/python-app.yml index e36c221..7504afd 100644 --- a/.github/workflows/python-app.yml +++ b/.github/workflows/python-app.yml @@ -14,7 +14,7 @@ jobs: - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '3.10.13' + python-version: '3.11.0' - name: Install Python packages run: | From 8ee19288d90a847a0a53312d32c303319cec139b Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 11:34:20 +0530 Subject: [PATCH 60/65] Update __init__.py --- rbiparser/__init__.py | 29 +++++++++++------------------ 1 file changed, 11 insertions(+), 18 deletions(-) diff --git a/rbiparser/__init__.py b/rbiparser/__init__.py index 5fbf284..0e5d3a6 100644 --- a/rbiparser/__init__.py +++ b/rbiparser/__init__.py @@ -68,28 +68,21 @@ exclude_words = ["to", "the", "at", "of", "by", "as", "for", "via"] -def get_sheet_urls(url): - """Scrapes the RBI page and gets the list of .xlsx sheets.""" - r = requests.get(url) - if r.status_code != 200: - raise Exception("Invalid response from", url) - - # Extract the HTML content for debugging. - html_content = r.content - print("HTML Content:") - print(html_content) - # Extract the urls. - s = soup(html_content, "lxml") - links = [a["href"] for a in s.find_all("a", href=True)] +def get_sheet_urls(url): + """Scrapes the RBI page and gets the list of .xlsx sheets.""" + r = requests.get(url) + if r.status_code != 200: + raise Exception("Invalid response from", url) - # Filter links with ".xls" in the href. - xls_links = [link for link in links if ".xls" in link] + # Extract the urls. + s = soup(r.content, "lxml") + links = s.find_all("a", href=re.compile(".\.xls.")) - if len(xls_links) < 1: - raise Exception("Couldn't find any .xls urls") + if len(links) < 1: + raise Exception("Couldn't find any .xlsx urls") - return xls_links + return [l["href"] for l in links] From 5c0e207e8a44bda10bc50aefa52e451538e449fa Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 12:09:36 +0530 Subject: [PATCH 61/65] Update __init__.py --- rbiparser/__init__.py | 38 ++++++++++++++++++++++++++++---------- 1 file changed, 28 insertions(+), 10 deletions(-) diff --git a/rbiparser/__init__.py b/rbiparser/__init__.py index 0e5d3a6..df975cc 100644 --- a/rbiparser/__init__.py +++ b/rbiparser/__init__.py @@ -68,22 +68,40 @@ exclude_words = ["to", "the", "at", "of", "by", "as", "for", "via"] +import requests +from bs4 import BeautifulSoup as soup +import re def get_sheet_urls(url): - """Scrapes the RBI page and gets the list of .xlsx sheets.""" - r = requests.get(url) - if r.status_code != 200: - raise Exception("Invalid response from", url) + """Scrapes the RBI page and gets the list of .xls sheets.""" + try: + r = requests.get(url) + r.raise_for_status() # Raises an HTTPError for bad responses + + # Print the content for inspection + print("Page content:", r.content) + + # Extract the URLs + s = soup(r.content, "html.parser") + links = s.find_all("a", href=re.compile("\.xls$")) + + if len(links) < 1: + raise Exception("Couldn't find any .xls URLs") + + return [l["href"] for l in links] - # Extract the urls. - s = soup(r.content, "lxml") - links = s.find_all("a", href=re.compile(".\.xls.")) + except Exception as e: + print("Error:", e) + return [] - if len(links) < 1: - raise Exception("Couldn't find any .xlsx urls") +# Example URL +example_url = "https://example.com/rbi_page" - return [l["href"] for l in links] +# Get sheet URLs +sheet_urls = get_sheet_urls(example_url) +# Print the result +print("Sheet URLs:", sheet_urls) def convert_xlsx_to_csv(src, target, headers): From 2c6ea3e819af9f41559f378b24bfadd6dcca2883 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 13:06:10 +0530 Subject: [PATCH 62/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index e4981aa..d6de45f 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -14,7 +14,7 @@ jobs: - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '3.11.0' + python-version: '2.7' - name: Install Python packages run: | From c7ffe75a4513e4070c14bac255bc5bd71997b490 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 13:10:14 +0530 Subject: [PATCH 63/65] Update __init__.py --- rbiparser/__init__.py | 53 +++++++++++++++++++++++-------------------- 1 file changed, 29 insertions(+), 24 deletions(-) diff --git a/rbiparser/__init__.py b/rbiparser/__init__.py index df975cc..db56d07 100644 --- a/rbiparser/__init__.py +++ b/rbiparser/__init__.py @@ -24,6 +24,10 @@ import os import glob import string +import requests +from bs4 import BeautifulSoup as soup +import re + try: from urlparse import urlparse @@ -68,40 +72,41 @@ exclude_words = ["to", "the", "at", "of", "by", "as", "for", "via"] -import requests -from bs4 import BeautifulSoup as soup -import re - def get_sheet_urls(url): - """Scrapes the RBI page and gets the list of .xls sheets.""" + """Scrapes the RBI page and gets the list of .xlsx sheets.""" try: - r = requests.get(url) - r.raise_for_status() # Raises an HTTPError for bad responses + # Adding headers to mimic a web browser + headers = { + "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.3029.110 Safari/537.3" + } - # Print the content for inspection - print("Page content:", r.content) + # Making the request with headers and increased timeout + r = requests.get(url, headers=headers, timeout=10) + r.raise_for_status() # Raises an HTTPError if the HTTP request returned an unsuccessful status code - # Extract the URLs - s = soup(r.content, "html.parser") - links = s.find_all("a", href=re.compile("\.xls$")) + # Extract the urls. + s = soup(r.content, "lxml") + links = s.find_all("a", href=re.compile(r"\.xls.")) if len(links) < 1: - raise Exception("Couldn't find any .xls URLs") + raise Exception("Couldn't find any .xlsx urls") return [l["href"] for l in links] - except Exception as e: - print("Error:", e) - return [] - -# Example URL -example_url = "https://example.com/rbi_page" + except requests.exceptions.RequestException as e: + # Print detailed error information + print("Error making request:", e) + print("Response status code:", r.status_code) + print("Response content:", r.content) + raise -# Get sheet URLs -sheet_urls = get_sheet_urls(example_url) - -# Print the result -print("Sheet URLs:", sheet_urls) +# Example usage +url = "https://example.com/rbi_page" +try: + sheet_urls = get_sheet_urls(url) + print("List of .xlsx sheet URLs:", sheet_urls) +except Exception as e: + print("An error occurred:", e) def convert_xlsx_to_csv(src, target, headers): From 01d1ac46a448188ab7f3e6ad7c210fcdeecd82ab Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 13:23:33 +0530 Subject: [PATCH 64/65] Update main.yml --- .github/workflows/main.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml index d6de45f..e4981aa 100644 --- a/.github/workflows/main.yml +++ b/.github/workflows/main.yml @@ -14,7 +14,7 @@ jobs: - name: Setup Python uses: actions/setup-python@v4 with: - python-version: '2.7' + python-version: '3.11.0' - name: Install Python packages run: | From e69b5dcd904a891a7d15f69dde8f3a7030c5bc88 Mon Sep 17 00:00:00 2001 From: 19121A05E5 <86068887+19121A05E5@users.noreply.github.com> Date: Thu, 30 Nov 2023 13:50:52 +0530 Subject: [PATCH 65/65] Update __init__.py --- rbiparser/__init__.py | 50 +++++++++++-------------------------------- 1 file changed, 13 insertions(+), 37 deletions(-) diff --git a/rbiparser/__init__.py b/rbiparser/__init__.py index db56d07..3960182 100644 --- a/rbiparser/__init__.py +++ b/rbiparser/__init__.py @@ -24,9 +24,6 @@ import os import glob import string -import requests -from bs4 import BeautifulSoup as soup -import re try: @@ -73,40 +70,19 @@ exclude_words = ["to", "the", "at", "of", "by", "as", "for", "via"] def get_sheet_urls(url): - """Scrapes the RBI page and gets the list of .xlsx sheets.""" - try: - # Adding headers to mimic a web browser - headers = { - "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.3029.110 Safari/537.3" - } - - # Making the request with headers and increased timeout - r = requests.get(url, headers=headers, timeout=10) - r.raise_for_status() # Raises an HTTPError if the HTTP request returned an unsuccessful status code - - # Extract the urls. - s = soup(r.content, "lxml") - links = s.find_all("a", href=re.compile(r"\.xls.")) - - if len(links) < 1: - raise Exception("Couldn't find any .xlsx urls") - - return [l["href"] for l in links] - - except requests.exceptions.RequestException as e: - # Print detailed error information - print("Error making request:", e) - print("Response status code:", r.status_code) - print("Response content:", r.content) - raise - -# Example usage -url = "https://example.com/rbi_page" -try: - sheet_urls = get_sheet_urls(url) - print("List of .xlsx sheet URLs:", sheet_urls) -except Exception as e: - print("An error occurred:", e) + """Scrapes the RBI page and gets the list of .xlsx sheets.""" + r = requests.get(url) + if r.status_code != 200: + raise Exception("Invalid response from", url) + + # Extract the urls. + s = soup(r.content, "lxml") + links = s.find_all("a", href=re.compile(".\.xls.")) + + if len(links) < 1: + raise Exception("Couldn't find any .xlsx urls") + + return [l["href"] for l in links] def convert_xlsx_to_csv(src, target, headers):