Programming/nodejs

[NodeJS] 넷폴릭스 크롤링

낭강 2021. 10. 3. 01:50
var express = require('express');
var router = express.Router();
 
const axios = require("axios");
const cheerio = require("cheerio");
var html = "";
let movie = [];
async function getHTML(){
    try{
        console.log("getHtml");
        return await axios.get("https://www.netflix.com/kr/browse/genre/34399");
    }catch(err){
        console.log(err);
    }
}

async function parsing(){
    html = await getHTML();
    const $ = cheerio.load(html.data);
    const $rankList = $(".nm-collections-row");
     
    console.log($rankList.length);
    $rankList.each((idx,node)=>{
        if($(node).find("h2").text()==="Netflix 인기 콘텐츠"){
            $(node).find("li").each((i,s)=>{ 
                movie.push({
                    title:$(s).find("span.nm-collections-title-name").text(),
                    image:$(s).find("img.nm-collections-title-img").attr('src')
                }); 
        });
        }
    }); 
    return movie;
}
parsing();
router.get('/', function(req, res,next) {
    res.send(movie);
  }); 

  module.exports = router;

이후 설명추가예정