#!/usr/bin/env python3
# Web Automation Service - Main Script
import os
import sys
from pathlib import Path
from datetime import datetime
# Absolute path of the directory that contains this script file.
SCRIPT_DIR = Path(__file__).parent.resolve()
# Scrape reports are written into an "output" folder next to the script.
OUTPUT_DIR = SCRIPT_DIR / "output"
def scrape_web(url, output_dir=None):
    """Fetch a web page and write a Markdown summary report to disk.

    The report lists the URL, the HTTP status code, the size of the response
    body in bytes, the page title (when a ``<title>`` element is present) and
    the number of double-quoted ``href="..."`` attributes found in the page.

    Args:
        url: Address of the page to fetch.
        output_dir: Directory to write the report into. Defaults to the
            module-level ``OUTPUT_DIR``. It is created if it does not exist.

    Returns:
        The path of the written report as a string on success, or a string
        of the form ``"Error: <message>"`` if anything fails (including the
        ``requests`` package being unavailable).
    """
    try:
        # Imported lazily so that a missing dependency is reported through the
        # same "Error: ..." return value as every other failure.
        import re
        import requests

        response = requests.get(url, timeout=10)
        html = response.text
        # Take the timestamp once so the report body and the file name agree.
        now = datetime.now()

        sections = [
            f"# Web Scraping Report: {url}\n\n",
            f"**Generated:** {now.strftime('%Y-%m-%d %H:%M:%S')}\n\n",
            "## Scraping Results\n\n",
            f"- URL: {url}\n",
            f"- Status Code: {response.status_code}\n",
            # response.content is the raw body, so its length is really bytes;
            # len(response.text) would count decoded characters instead.
            f"- Content Length: {len(response.content)} bytes\n\n",
        ]

        # Extract title. Tag names are case-insensitive in HTML and the title
        # text may span several lines, hence IGNORECASE and DOTALL.
        title_match = re.search(
            r'<title[^>]*>(.*?)</title>', html, re.IGNORECASE | re.DOTALL
        )
        if title_match:
            # Collapse internal newlines/indentation into single spaces.
            title = " ".join(title_match.group(1).split())
            sections.append(f"**Page Title:** {title}\n\n")

        # Extract links (only double-quoted href attributes are counted).
        links = re.findall(r'href="([^"]+)"', html)
        sections.append(f"**Found {len(links)} links**\n\n")

        target_dir = OUTPUT_DIR if output_dir is None else Path(output_dir)
        target_dir.mkdir(parents=True, exist_ok=True)
        output_file = target_dir / f"scrape_{now.strftime('%Y%m%d_%H%M%S')}.md"
        output_file.write_text("".join(sections), encoding='utf-8')
        return str(output_file)
    except Exception as e:
        # Best-effort contract: callers receive an error string, never a raise.
        return f"Error: {e}"
def main():
    """Command-line entry point: dispatch ``<action> <url>`` from ``sys.argv``.

    Prints usage help and exits with status 1 when fewer than two arguments
    are given or the action is not recognised. For the ``scrape`` action it
    calls ``scrape_web`` and prints the path of the saved report; if
    ``scrape_web`` reports a failure, the error is printed to stderr and the
    process exits with status 1.
    """
    if len(sys.argv) < 3:
        print("Usage: python3 main.py <action> <url>")
        print("\nActions:")
        print(" scrape <url> - Scrape web page")
        print("\nExamples:")
        print(" python3 main.py scrape https://example.com")
        sys.exit(1)

    action = sys.argv[1]
    url = sys.argv[2]

    if action != "scrape":
        print(f"Unknown action: {action}")
        sys.exit(1)

    result = scrape_web(url)
    # scrape_web signals failure by returning an "Error: ..." string rather
    # than raising; do not present that as a saved file path.
    if result.startswith("Error:"):
        print(result, file=sys.stderr)
        sys.exit(1)
    print(f"Scraping saved to: {result}")
# Run the CLI only when executed as a script, not when imported as a module.
if __name__ == "__main__":
    main()