Comparer le texte

Encuentra la diferencia entre dos archivos de texto

Real-time diff

Unified diff

Collapse lines

Highlight change

Syntax highlighting

Outils

Diffchecker Desktop: The most secure way to run Diffchecker. Get the Diffchecker Desktop app: your diffs never leave your computer! Get Desktop

3주차 과제 비교

Created 3 years ago. Diff never expires

Lines
Total
Removed

Words
Total
Removed

To continue using this feature, upgrade to Diffchecker Pro View Pricing

15 lines

Lines
Total
Added

Words
Total
Added

To continue using this feature, upgrade to Diffchecker Pro View Pricing

29 lines

## 웹 크롤링에 필요한 세팅: requests와 bs4 패키지

import requests

from bs4 import BeautifulSoup

headers = {'User-Agent' : 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)AppleWebKit/537.36 (KHTML, like Gecko) Chrome/73.0.3683.86 Safari/537.36'}

data = requests.get('https://www.genie.co.kr/chart/top200?ditc=M&rtm=N&ymd=20210701',headers=headers)

soup = BeautifulSoup(data.text, 'html.parser')

trs = soup.select('#body-content > div.newest-list > div > table > tbody > tr')

## 지니뮤직의 1~50위 곡의 순위/곡명/가수를 스크래핑해보자

# 순위

#body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.number

# 곡명

#body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.info > a.title.ellipsis

# 가수

#body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.info > a.artist.ellipsis

# 공통부분:

#body-content > div.newest-list > div > table > tbody > tr

for tr in trs:

title = tr.select_one('td.info > a.title.ellipsis').text.strip()

# 최종 정리:

rank = tr.select_one('td.number').text[0:2].strip()

musics = list(soup.select("#body-content > div.newest-list > div > table > tbody > tr"))

artist = tr.select_one('td.info > a.artist.ellipsis').text

for music in musics:

rank = music.select_one("td.number").text[:2].replace('\n', ' ')

title = music.select_one("td.info > a.title.ellipsis").text.strip()

artist = music.select_one("td.info > a.artist.ellipsis").text.strip()

print(rank, title, artist)

Les différences enregistrées

Texte d'origine

Ouvrir un fichier

Texte modifié

Ouvrir un fichier

## 웹 크롤링에 필요한 세팅: requests와 bs4 패키지
import requests
from bs4 import BeautifulSoup
# Browser-like User-Agent sent with the request.
# NOTE(review): presumably the site rejects the default `requests`
# User-Agent -- confirm before removing this header.
headers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)AppleWebKit/537.36 (KHTML, like Gecko) Chrome/73.0.3683.86 Safari/537.36'
}

# Download the Genie top-200 chart page (the query string pins ymd=20210701).
# A timeout keeps the script from hanging forever on a stalled connection.
data = requests.get(
    'https://www.genie.co.kr/chart/top200?ditc=M&rtm=N&ymd=20210701',
    headers=headers,
    timeout=10,
)
# Fail loudly on 4xx/5xx instead of parsing an error page as if it were
# the chart.
data.raise_for_status()

# Parse the response body with the stdlib-backed HTML parser.
soup = BeautifulSoup(data.text, 'html.parser')

## Scrape the rank / song title / artist of the songs ranked 1-50 on Genie Music.
#
# CSS selectors copied from the page for the first row (tr:nth-child(1)):
#   rank:   #body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.number
#   title:  #body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.info > a.title.ellipsis
#   artist: #body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.info > a.artist.ellipsis
# Common prefix shared by all three (one match per chart row):
#   #body-content > div.newest-list > div > table > tbody > tr

# Final version: select every chart row once, then look up the three cells
# relative to each row. `select` already returns a list-like result, so no
# extra list() copy is needed.
musics = soup.select("#body-content > div.newest-list > div > table > tbody > tr")
for music in musics:
    rank_cell = music.select_one("td.number")
    title_cell = music.select_one("td.info > a.title.ellipsis")
    artist_cell = music.select_one("td.info > a.artist.ellipsis")
    if rank_cell is None or title_cell is None or artist_cell is None:
        # select_one returns None when nothing matches; skip rows that do
        # not have the expected cells instead of crashing on `.text`.
        continue

    # Only the first two characters of the cell text are kept as the rank
    # (presumably the cell contains more than the number -- verify against
    # the page). strip() drops the newline left behind for one-digit ranks.
    rank = rank_cell.text[:2].strip()
    title = title_cell.text.strip()
    artist = artist_cell.text.strip()

    # Print inside the loop so every row is reported, not just the last one.
    print(rank, title, artist)