網路爬蟲

shie · 發表於 2026-3-3 11:36:46

# -*- coding: utf-8 -*-
"""
Created on Tue Mar  3 11:26:32 2026

@author: AEUST
"""

import requests
from bs4 import BeautifulSoup

# Scrape the PTT "AllTogether" board index and print each post's title
# followed by its absolute URL.

# Site root used to turn the scraped hrefs into absolute URLs.
url = 'https://www.ptt.cc/'

# NOTE(review): the over18 cookie presumably bypasses PTT's age-confirmation
# page -- confirm against the site's behavior.
# A timeout is set so the script cannot hang forever on a stalled connection.
web = requests.get(
    'https://www.ptt.cc/bbs/AllTogether/index.html',
    cookies={'over18': '1'},
    timeout=10,
)
# Fail loudly on an HTTP error instead of silently parsing an error page.
web.raise_for_status()

soup = BeautifulSoup(web.text, "html.parser")
titles = soup.find_all('div', class_='title')  # every <div class="title"> element

for entry in titles:
    link = entry.find('a')
    # Some title divs contain no <a> tag; skip those.
    if link is None:
        continue
    print(link.get_text())  # visible text of the link
    # Join root and href with exactly one slash, whether or not the href
    # starts with '/', so the printed URL never contains '//' in its path.
    print(url.rstrip('/') + '/' + link['href'].lstrip('/'), end='\n\n')

print("123456789  施勢帆")

		自動登錄	找回密碼
密碼			立即註冊

網路爬蟲

瀏覽過的版塊