TrendRadar/.github/workflows/crawler.yml

119 lines
4.3 KiB
YAML
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

name: Hot News Crawler
on:
schedule:
# ⚠️ 重要提示:我们使用的是 GitHub 官方提供的资源来进行的推送,而每个账号的资源是限额的
# 为了不被官方判定为滥用而面临封号的风险,不建议设置比半小时更短的执行间隔
#
# Cron 表达式示例注意GitHub Actions 使用 UTC 时间,北京时间需要减 8 小时):
# - "0 * * * *" # 每小时整点运行一次(实际有偏差)
# - "*/30 * * * *" # 每 30 分钟执行一次
# - "*/30 0-14 * * *" # 每天 UTC 0:00-14:00北京时间 8:00-22:00每 30 分钟运行一次
# - "0 0,6,12,18 * * *" # 每天 UTC 0:00,6:00,12:00,18:00北京时间 8:00,14:00,20:00,次日2:00
- cron: "0 * * * *"
workflow_dispatch:
concurrency:
group: crawler-${{ github.ref_name }}
cancel-in-progress: true
permissions:
contents: write
jobs:
crawl:
runs-on: ubuntu-latest
timeout-minutes: 30
steps:
- name: Checkout repository
uses: actions/checkout@v3
with:
fetch-depth: 0
clean: true
- name: Set up Python
uses: actions/setup-python@v4
with:
python-version: "3.10"
- name: Install dependencies
run: |
python -m pip install --upgrade pip
pip install -r requirements.txt
- name: Verify required files
run: |
echo "🔍 检查必需的配置文件..."
if [ ! -f config/config.yaml ]; then
echo "❌ 错误: config/config.yaml 文件不存在"
exit 1
fi
if [ ! -f config/frequency_words.txt ]; then
echo "❌ 错误: config/frequency_words.txt 文件不存在"
exit 1
fi
echo "✅ 配置文件检查通过"
- name: Run crawler
env:
FEISHU_WEBHOOK_URL: ${{ secrets.FEISHU_WEBHOOK_URL }}
TELEGRAM_BOT_TOKEN: ${{ secrets.TELEGRAM_BOT_TOKEN }}
TELEGRAM_CHAT_ID: ${{ secrets.TELEGRAM_CHAT_ID }}
DINGTALK_WEBHOOK_URL: ${{ secrets.DINGTALK_WEBHOOK_URL }}
WEWORK_WEBHOOK_URL: ${{ secrets.WEWORK_WEBHOOK_URL }}
WEWORK_MSG_TYPE: ${{ secrets.WEWORK_MSG_TYPE }}
EMAIL_FROM: ${{ secrets.EMAIL_FROM }}
EMAIL_PASSWORD: ${{ secrets.EMAIL_PASSWORD }}
EMAIL_TO: ${{ secrets.EMAIL_TO }}
EMAIL_SMTP_SERVER: ${{ secrets.EMAIL_SMTP_SERVER }}
EMAIL_SMTP_PORT: ${{ secrets.EMAIL_SMTP_PORT }}
NTFY_TOPIC: ${{ secrets.NTFY_TOPIC }}
NTFY_SERVER_URL: ${{ secrets.NTFY_SERVER_URL }}
NTFY_TOKEN: ${{ secrets.NTFY_TOKEN }}
BARK_URL: ${{ secrets.BARK_URL }}
SLACK_WEBHOOK_URL: ${{ secrets.SLACK_WEBHOOK_URL }}
GITHUB_ACTIONS: true
run: python main.py
- name: Commit and push if changes
env:
BRANCH_NAME: ${{ github.event.repository.default_branch }}
run: |
git config --global user.name 'GitHub Actions'
git config --global user.email 'actions@github.com'
echo "🔄 Syncing with remote (branch: $BRANCH_NAME)..."
git fetch origin $BRANCH_NAME
# 保存当前更改
git stash --include-untracked || echo "Nothing to stash"
# 同步到远程最新
git reset --hard origin/$BRANCH_NAME
# 恢复本次更改
git stash pop || echo "Nothing to pop"
git add -A
if git diff --quiet && git diff --staged --quiet; then
echo "📭 No changes to commit"
exit 0
fi
echo "📝 Committing changes..."
TIMESTAMP=$(TZ=Asia/Shanghai date "+%Y-%m-%d %H:%M:%S")
git commit -m "Auto update by GitHub Actions at $TIMESTAMP"
echo "⬆️ Pushing changes with retry..."
for i in {1..5}; do
git pull --rebase origin $BRANCH_NAME && git push origin $BRANCH_NAME && {
echo "✅ Successfully pushed on attempt $i"
exit 0
}
echo "⚠️ Attempt $i failed, waiting $((i*3)) seconds..."
sleep $((i * 3))
done
echo "❌ Failed to push after 5 attempts"
exit 1