updated yaml #6
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: Deploy and Parse | |
on: | |
workflow_dispatch: | |
push: | |
branches: | |
- main | |
jobs: | |
deploy: | |
runs-on: ubuntu-latest | |
steps: | |
- name: Checkout repository | |
uses: actions/checkout@v3 | |
with: | |
fetch-depth: 0 | |
- uses: actions/setup-python@v4 | |
with: | |
python-version: "3.10" | |
- name: Install Python dependencies | |
run: | | |
pip install \ | |
"wheel" \ | |
"lxml" \ | |
"mkdocs-material" \ | |
"cairosvg>=2.5" \ | |
"mkdocs-git-committers-plugin-2>=1.1.1" \ | |
"mkdocs-git-revision-date-localized-plugin>=1.0" \ | |
"mkdocs-minify-plugin>=0.3" \ | |
"mkdocs-rss-plugin>=1.2" \ | |
"mkdocs-redirects>=1.0" \ | |
"pillow<10" | |
- name: Sync markdown with script | |
run: python mdown_copy.py | |
- name: Deploy documentation | |
env: | |
GH_TOKEN: ${{ secrets.GITHUB_TOKEN }} | |
run: | | |
mkdocs gh-deploy --force | |
mkdocs --version | |
build: | |
runs-on: ubuntu-latest | |
needs: deploy | |
steps: | |
- uses: actions/checkout@v3 | |
- uses: actions/setup-python@v4 | |
with: | |
python-version: "3.8" | |
- name: upgrade pip and install python packages | |
run: | | |
python -m pip install --upgrade pip | |
pip install -U pip setuptools | |
pip install requests | |
pip install beautifulsoup4 | |
pip install pandas | |
pip install lxml | |
pip install html5lib | |
- name: output_render | |
uses: jannekem/run-python-script-action@v1 | |
with: | |
script: | | |
import csv | |
import json | |
import requests | |
from bs4 import BeautifulSoup | |
url = "https://ladiesoflandsat.github.io/LOLManuscriptMonday/" | |
response = requests.get(url) | |
key_order = ["Week", "Date", "Name","Article Title","Article Link","Twitter Handle","MM Tweet","Key Words"] | |
if response.status_code == 200: | |
soup = BeautifulSoup(response.text, 'html.parser') | |
table = soup.find('table') | |
if table: | |
table_data = [] | |
rows = table.find_all('tr') | |
headers = [header.text.strip() for header in rows[0].find_all('th')] | |
for row in rows[1:]: | |
row_data = {} | |
columns = row.find_all('td') | |
for i in range(len(headers)): | |
row_data[headers[i]] = columns[i].text.strip() | |
row_data = {key: row_data[key] for key in key_order if key in row_data} | |
table_data.append(row_data) | |
with open('sorted_data.json', 'w') as json_file: | |
json.dump(table_data, json_file, indent=2) | |
column_headers = key_order | |
csv_file_name = "output.csv" | |
with open(csv_file_name, mode="w", newline="", encoding="utf-8") as csv_file: | |
writer = csv.DictWriter(csv_file, fieldnames=column_headers) | |
writer.writeheader() | |
for data in table_data: | |
writer.writerow(data) | |
print(f"Data has been written to {csv_file_name}.") | |
else: | |
print("No table found on the web page.") | |
else: | |
print(f"Failed to fetch web page. Status code: {response.status_code}") | |
- name: commit files | |
continue-on-error: true | |
run: | | |
today=$(date +"%Y-%m-%d") | |
git config --local user.email "[email protected]" | |
git config --local user.name "GitHub Action" | |
git add -A | |
git commit -m "updated datasets ${today} UTC" -a | |
- name: push changes | |
continue-on-error: true | |
uses: ad-m/[email protected] | |
with: | |
github_token: ${{ secrets.GITHUB_TOKEN }} | |
branch: main |