Compare text

Find the difference between two text files

Real-time editor

Hide unchanged lines

Disable line wrap

Layout

Diff precision

Syntax highlighting

Diffchecker Desktop: The most secure way to run Diffchecker. Get the Diffchecker Desktop app: your diffs never leave your computer! Get Desktop

3주차 과제 비교

Created 4 years ago. Diff never expires.

12 removals

Lines
Total
Removed

Characters
Total
Removed

To continue using this feature, upgrade to Diffchecker Pro View Pricing

15 lines

25 additions

Lines
Total
Added

Characters
Total
Added

To continue using this feature, upgrade to Diffchecker Pro View Pricing

29 lines

## 웹 크롤링에 필요한 세팅: requests와 bs4 패키지

import requests

from bs4 import BeautifulSoup

headers = {'User-Agent' : 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)AppleWebKit/537.36 (KHTML, like Gecko) Chrome/73.0.3683.86 Safari/537.36'}

data = requests.get('https://www.genie.co.kr/chart/top200?ditc=M&rtm=N&ymd=20210701',headers=headers)

soup = BeautifulSoup(data.text, 'html.parser')

trs = soup.select('#body-content > div.newest-list > div > table > tbody > tr')

## 지니뮤직의 1~50위 곡의 순위/곡명/가수를 스크래핑해보자

# 순위

#body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.number

# 곡명

#body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.info > a.title.ellipsis

# 가수

#body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.info > a.artist.ellipsis

# 공통부분:

#body-content > div.newest-list > div > table > tbody > tr

for tr in trs:

title = tr.select_one('td.info > a.title.ellipsis').text.strip()

# 최종 정리:

rank = tr.select_one('td.number').text[0:2].strip()

musics = list(soup.select("#body-content > div.newest-list > div > table > tbody > tr"))

artist = tr.select_one('td.info > a.artist.ellipsis').text

for music in musics:

rank = music.select_one("td.number").text[:2].replace('\n', ' ')

title = music.select_one("td.info > a.title.ellipsis").text.strip()

artist = music.select_one("td.info > a.artist.ellipsis").text.strip()

print(rank, title, artist)

Saved diffs

Original text

Open file

Changed text

Open file

## 웹 크롤링에 필요한 세팅: requests와 bs4 패키지
import requests
from bs4 import BeautifulSoup
# Browser-like User-Agent header sent with the chart request.
headers = {'User-Agent' : 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)AppleWebKit/537.36 (KHTML, like Gecko) Chrome/73.0.3683.86 Safari/537.36'}
# Fetch the Genie top-200 chart page (query: ditc=M, rtm=N, ymd=20210701).
# The timeout keeps a stalled connection from hanging the script forever.
data = requests.get(
    'https://www.genie.co.kr/chart/top200?ditc=M&rtm=N&ymd=20210701',
    headers=headers,
    timeout=10,
)
# Fail loudly on an HTTP error status instead of silently parsing an error page.
data.raise_for_status()
# Parse the response body with the built-in HTML parser.
soup = BeautifulSoup(data.text, 'html.parser')

## 지니뮤직의 1~50위 곡의 순위/곡명/가수를 스크래핑해보자
# 순위
#body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.number
# 곡명
#body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.info > a.title.ellipsis
# 가수
#body-content > div.newest-list > div > table > tbody > tr:nth-child(1) > td.info > a.artist.ellipsis
# 공통부분:
#body-content > div.newest-list > div > table > tbody > tr

# Final version: print the rank, title and artist of every chart row.
# select() already returns a list-like result, so no list() wrapper is needed.
musics = soup.select("#body-content > div.newest-list > div > table > tbody > tr")
for music in musics:
    # Keep only the first two characters of the rank cell and turn a newline
    # inside that slice into a space.
    # NOTE(review): the two-character slice assumes ranks below 100 — confirm
    # if more than the first page of the chart is ever scraped.
    rank = music.select_one("td.number").text[:2].replace('\n', ' ')
    title = music.select_one("td.info > a.title.ellipsis").text.strip()
    artist = music.select_one("td.info > a.artist.ellipsis").text.strip()
    # Print inside the loop so every row is reported, not just the last one
    # (and so an empty result no longer raises NameError).
    print(rank, title, artist)