pypi.org/

 

PyPI · The Python Package Index

The Python Package Index (PyPI) is a repository of software for the Python programming language.

pypi.org


 

pip install requests 
requests 패키지 설치됐음
파이참 터미널에서 설치해도 됨 
requests 들어와있음 
+ 버튼을 클릭해서 bs4(BeautifulSoup) 패키지도 같은 방법으로 설치함

 

파일 만들기 

import requests

# Script: download one web page and print its body as text.
url = 'https://movie.naver.com/movie/running/current.nhn'
# requests applies no timeout by default, so pass one explicitly to avoid
# hanging forever when the server does not answer.
response = requests.get(url, timeout=10)  # fetch the content of the web page
# Raise requests.HTTPError on a 4xx/5xx answer instead of printing an
# error page as if it were the real content.
response.raise_for_status()
print(response.text)  # print the body as text

자바스크립트 코드로 가져왔음

 

 

 

 

 

 

 

import requests
from bs4 import BeautifulSoup

# Script: fetch a sample page and print the first <title>, <h2> and <li>
# elements found in it.
url = 'https://www.ymori.com/books/python2nen/test1.html'
# requests applies no timeout by default; set one so the script cannot
# block indefinitely on an unresponsive server.
response = requests.get(url, timeout=10)
# Fail loudly on a 4xx/5xx answer rather than parsing an error page.
response.raise_for_status()
soup = BeautifulSoup(response.content, "html.parser")

# find() returns only the first matching tag, or None when there is none.
title = soup.find("title")
jang = soup.find("h2")
li = soup.find("li")

print(title)
print(jang)
print(li)

결과

 

 

 

# Import the submodule explicitly: a bare "import urllib" does not guarantee
# that urllib.parse is loaded (it only worked because another library
# happened to import it first).
import urllib.parse

import requests
from bs4 import BeautifulSoup

# Script: list every image referenced by a page as
# "<absolute image URL> >> <file name>".
url = 'https://www.ymori.com/books/python2nen/test2.html'
# requests applies no timeout by default; set one to avoid hanging forever.
response = requests.get(url, timeout=10)
# Fail loudly on a 4xx/5xx answer rather than parsing an error page.
response.raise_for_status()
soup = BeautifulSoup(response.content, "html.parser")
for element in soup.find_all("img"):
    src = element.get("src")
    if not src:
        # An <img> without a src would make urljoin() return the page URL
        # itself, which is not an image; skip it.
        continue
    # Resolve relative paths against the page URL.
    image_url = urllib.parse.urljoin(url, src)
    # The file name is the last path segment of the image URL.
    filename = image_url.split("/")[-1]
    print(image_url, ">>", filename)

 

-사진 저장하기 

import time
# Import the submodule explicitly: a bare "import urllib" does not guarantee
# that urllib.parse is loaded (it only worked because another library
# happened to import it first).
import urllib.parse
from pathlib import Path

import requests
from bs4 import BeautifulSoup

# Script: download every image referenced by a page into ./download2.
url = 'https://www.ymori.com/books/python2nen/test2.html'
# requests applies no timeout by default; set one to avoid hanging forever.
response = requests.get(url, timeout=10)
# Fail loudly on a 4xx/5xx answer rather than parsing an error page.
response.raise_for_status()
soup = BeautifulSoup(response.content, "html.parser")

out_folder = Path("download2")
out_folder.mkdir(exist_ok=True)

for element in soup.find_all("img"):
    src = element.get("src")
    if not src:
        # An <img> without a src would make urljoin() return the page URL
        # itself, so the HTML page would be saved as an "image"; skip it.
        continue

    # Resolve relative paths against the page URL.
    image_url = urllib.parse.urljoin(url, src)
    # The file name is the last path segment of the image URL.
    filename = image_url.split("/")[-1]
    if not filename:
        # URL ends with "/": there is no file name to save under.
        continue

    imgdata = requests.get(image_url, timeout=10)
    if imgdata.ok:
        out_path = out_folder.joinpath(filename)
        with open(out_path, mode="wb") as f:
            f.write(imgdata.content)
    else:
        # Do not store an HTTP error body as if it were image data.
        print("skipped", image_url, "status", imgdata.status_code)

    # Pause between requests so the server is not hammered.
    time.sleep(1)

저장됐음

 

+ Recent posts