-
Notifications
You must be signed in to change notification settings - Fork 20
/
Copy pathscrapper.js
148 lines (103 loc) · 4.19 KB
/
scrapper.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
const cheerio = require('cheerio');
const axios = require('axios');
const puppeteer = require('puppeteer');
const userAgent = require('user-agents');
// https://www3.gogoanimes.fi/
// https://gogoanime.run
const baseUrl = "https://gogoanime.run"
async function newSeason(page) {
var anime_list = []
res = await axios.get(`${baseUrl}/new-season.html?page=${page}`)
const body = await res.data;
const $ = cheerio.load(body)
$('div.main_body div.last_episodes ul.items li').each((index, element) => {
$elements = $(element)
name = $elements.find('p').find('a')
img = $elements.find('div').find('a').find('img').attr('src')
link = $elements.find('div').find('a').attr('href')
anime_name = { 'name': name.html(), 'img_url': img, 'anime_id': link.slice(10,) }
anime_list.push(anime_name)
})
return await (anime_list)
}
async function popular(page) {
var anime_list = []
res = await axios.get(`${baseUrl}/popular.html?page=${page}`)
const body = await res.data;
const $ = cheerio.load(body)
$('div.main_body div.last_episodes ul.items li').each((index, element) => {
$elements = $(element)
name = $elements.find('p').find('a')
img = $elements.find('div').find('a').find('img').attr('src')
link = $elements.find('div').find('a').attr('href')
anime_name = { 'name': name.html(), 'img_url': img, 'anime_id': link.slice(10,) }
anime_list.push(anime_name)
})
return await (anime_list)
}
async function search(query) {
var anime_list = []
res = await axios.get(`${baseUrl}/search.html?keyword=${query}`)
const body = await res.data;
const $ = cheerio.load(body)
$('div.main_body div.last_episodes ul.items li').each((index, element) => {
$elements = $(element)
name = $elements.find('p').find('a')
img = $elements.find('div').find('a').find('img').attr('src')
link = $elements.find('div').find('a').attr('href')
anime_name = { 'name': name.html(), 'img_url': img, 'anime_id': link.slice(10,) }
anime_list.push(anime_name)
})
return await (anime_list)
}
async function anime(_anime_name) {
episode_array = []
res = await axios.get(`${baseUrl}/category/${_anime_name}`)
const body = await res.data;
const $ = cheerio.load(body)
img_url = $('div.anime_info_body_bg img').attr('src')
anime_name = $('div.anime_info_body_bg h1').text()
anime_about = $('div.main_body div:nth-child(2) > div.anime_info_body_bg > p:nth-child(5)').text()
anime_about = $('div.main_body div:nth-child(2) > div.anime_info_body_bg > p:nth-child(5)').text()
//add the new code here
el = $('#episode_page')
ep_start = 1
ep_end = el.children().last().find('a').text().split("-")[1]
for (let i = ep_start; i <= ep_end; i++) {
episode_array.push(`${_anime_name}-episode-${i}`)
}
anime_result = { 'name': anime_name, 'img_url': img_url, 'about': anime_about, 'episode_id': episode_array }
return await (anime_result)
}
async function watchAnime(episode_id) {
res = await axios.get(`${baseUrl}/${episode_id}`)
const body = await res.data;
$ = cheerio.load(body)
episode_link = $('li.dowloads > a').attr('href')
ep = await getDownloadLink(episode_link)
return await (ep)
}
async function getDownloadLink(episode_link) {
const browser = await puppeteer.launch({ headless: true });
const page = await browser.newPage();
await page.setUserAgent(userAgent.random().toString())
await page.goto(episode_link, { waitUntil: 'networkidle0' });
const links = await page.evaluate(() => {
let ep_links = []
//fetch all links
const ep = document.querySelector(".mirror_link");
ep.querySelectorAll('a').forEach((link)=>{
ep_links.push({"name":link.innerText.split("D ")[1].replace(/[()]/g, ""),"link":link.href})
})
return ep_links
});
await browser.close();
return (links)
}
module.exports = {
popular,
newSeason,
search,
anime,
watchAnime
}