-
Notifications
You must be signed in to change notification settings - Fork 7.7k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
* fix(route): zaker * refactor(zaker/utils): update API URLs
- Loading branch information
Showing
4 changed files
with
269 additions
and
80 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,44 @@ | ||
import { Route } from '@/types'; | ||
import cache from '@/utils/cache'; | ||
import * as cheerio from 'cheerio'; | ||
import { baseUrl, fetchItem, getSafeLineCookieWithData, parseList } from './utils'; | ||
import asyncPool from 'tiny-async-pool'; | ||
|
||
export const route: Route = { | ||
path: '/channel/:id?', | ||
parameters: { | ||
id: '分类 ID,可在 URL 中找到,默认为 `1`', | ||
}, | ||
radar: [ | ||
{ | ||
source: ['www.myzaker.com/channel/:id'], | ||
target: '/channel/:id', | ||
}, | ||
], | ||
name: '分类', | ||
example: '/zaker/channel/13', | ||
maintainers: ['LogicJake', 'kt286', 'TonyRL'], | ||
handler, | ||
}; | ||
|
||
async function handler(ctx) { | ||
const id = ctx.req.param('id') ?? 1; | ||
const link = `${baseUrl}/channel/${id}`; | ||
|
||
const { cookie, data } = await getSafeLineCookieWithData(link); | ||
|
||
const $ = cheerio.load(data); | ||
const feedTitle = $('head title').text(); | ||
const list = parseList($); | ||
|
||
const items = []; | ||
for await (const item of asyncPool(2, list, (item) => cache.tryGet(item.link!, () => fetchItem(item, cookie)))) { | ||
items.push(item); | ||
} | ||
|
||
return { | ||
title: feedTitle, | ||
link, | ||
item: items, | ||
}; | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,39 @@ | ||
import { Route } from '@/types'; | ||
import cache from '@/utils/cache'; | ||
import * as cheerio from 'cheerio'; | ||
import asyncPool from 'tiny-async-pool'; | ||
import { baseUrl, fetchItem, getSafeLineCookieWithData, parseList } from './utils'; | ||
|
||
export const route: Route = { | ||
path: '/focusread', | ||
radar: [ | ||
{ | ||
source: ['www.myzaker.com/'], | ||
target: '/focusread', | ||
}, | ||
], | ||
name: '精读', | ||
example: '/zaker/focusread', | ||
maintainers: ['AlexdanerZe', 'TonyRL'], | ||
handler, | ||
}; | ||
|
||
async function handler() { | ||
const link = `${baseUrl}/?pos=selected_article`; | ||
|
||
const { cookie, data } = await getSafeLineCookieWithData(link); | ||
|
||
const $ = cheerio.load(data); | ||
const list = parseList($); | ||
|
||
const items = []; | ||
for await (const item of asyncPool(2, list, (item) => cache.tryGet(item.link!, () => fetchItem(item, cookie)))) { | ||
items.push(item); | ||
} | ||
|
||
return { | ||
title: 'ZAKER 精读新闻', | ||
link, | ||
item: items, | ||
}; | ||
} |
This file was deleted.
Oops, something went wrong.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,186 @@ | ||
import { DataItem } from '@/types'; | ||
|
||
import CryptoJS from 'crypto-js'; | ||
import cache from '@/utils/cache'; | ||
import ofetch from '@/utils/ofetch'; | ||
import { config } from '@/config'; | ||
import logger from '@/utils/logger'; | ||
import * as cheerio from 'cheerio'; | ||
import { parseDate } from '@/utils/parse-date'; | ||
import timezone from '@/utils/timezone'; | ||
|
||
const hints = ['globalThis', 'headless', 'languages', 'permHook', 'vendor', 'webDriverValue', 'webdriver']; | ||
export const baseUrl = 'https://www.myzaker.com'; | ||
|
||
const generateSalt = (input: string, targetZeros = 20) => { | ||
for (let nonce = 0; nonce < 100_000_000; nonce++) { | ||
const hash = CryptoJS.SHA256(input + nonce).toString(); | ||
let leadingZeros = 0; | ||
|
||
for (const char of hash) { | ||
if (char !== '0') { | ||
leadingZeros += 4 - Number.parseInt(char, 16).toString(2).length; | ||
break; | ||
} | ||
leadingZeros += 4; | ||
} | ||
|
||
if (leadingZeros >= targetZeros) { | ||
return nonce; | ||
} | ||
} | ||
return 0; | ||
}; | ||
|
||
const padSeed = (seed: string) => { | ||
const padding = '0'.repeat(16); | ||
return CryptoJS.enc.Utf8.parse((seed + padding).slice(0, 16)); | ||
}; | ||
|
||
const encrypt = (data, seed: string) => { | ||
const iv = CryptoJS.enc.Utf8.parse('1234567890123456'); | ||
return CryptoJS.AES.encrypt(JSON.stringify(data), padSeed(seed), { | ||
iv, | ||
padding: CryptoJS.pad.Pkcs7, | ||
}); | ||
}; | ||
|
||
const encryptPayload = (data, seed: string) => encrypt(data, seed).ciphertext.toString(); | ||
|
||
export const getSafeLineCookieWithData = async (link): Promise<{ cookie: string; data: string }> => { | ||
const cacheKey = 'zaker:cookie'; | ||
const cacheAge = 3600; | ||
const cacheIn = await cache.get(cacheKey, false); | ||
if (cacheIn) { | ||
return JSON.parse(cacheIn); | ||
} | ||
const apiBaseUrl = 'https://challenge.rivers.chaitin.cn/captcha/api'; | ||
|
||
const headerResponse = await ofetch.raw(link); | ||
const session = headerResponse.headers | ||
.getSetCookie() | ||
.find((e) => e.startsWith('sl-session')) | ||
?.split(';')[0] | ||
.split('sl-session=')[1]; | ||
const onceId = headerResponse._data.match(/once_id:\s*"(.*?)",/)?.[1]; | ||
logger.debug(`getSafeLineCookie: sl-session=${session}, onceId=${onceId}`); | ||
if (!/window\.captcha/.test(headerResponse._data)) { | ||
logger.debug('getSafeLineCookie: Failed to get once_id'); | ||
return { | ||
cookie: headerResponse.headers | ||
.getSetCookie() | ||
.map((c) => c.split(';')[0]) | ||
.join('; '), | ||
data: headerResponse._data, | ||
}; | ||
} | ||
|
||
// await ofetch(`${apiBaseUrl}/index.html?${Math.random()}`); | ||
// await ofetch('${apiBaseUrl}/sdk.js'); | ||
const seedResponse = await ofetch<{ req_id: string; seed: string }>(`${apiBaseUrl}/seed`, { | ||
headers: { | ||
Referer: `${baseUrl}/`, | ||
}, | ||
query: { | ||
once_id: onceId, | ||
v: '1.0.0', | ||
hints: hints.sort(() => Math.random() - 0.5).join(','), | ||
}, | ||
}); | ||
|
||
const ua = config.ua; | ||
const seed = seedResponse.seed; | ||
const takeTime = Math.trunc(Math.random() * 2000 + 1000); | ||
logger.debug(`getSafeLineCookie: ua=${ua}, seed=${seed}, takeTime=${takeTime}`); | ||
const payload = encryptPayload( | ||
{ | ||
resolution: '1920x1080', | ||
languages: ['en-US'], | ||
useragents: [ua, ua, ua], | ||
hint: 0, | ||
salt: String(generateSalt(seed, 16)), | ||
taketime: takeTime, | ||
}, | ||
seed | ||
); | ||
|
||
const inspectResponse = await ofetch<{ req_id: string; jwt: string; reason: string }>(`${apiBaseUrl}/inspect`, { | ||
method: 'POST', | ||
headers: { | ||
Referer: `${baseUrl}/`, | ||
'Content-Type': 'text/plain', | ||
}, | ||
query: { | ||
seed, | ||
}, | ||
body: payload, | ||
}); | ||
logger.debug(`getSafeLineCookie: inspectResponse=${JSON.stringify(inspectResponse)}`); | ||
if (inspectResponse.reason) { | ||
logger.error(`getSafeLineCookie: reason=${inspectResponse.reason}`); | ||
return { | ||
cookie: headerResponse.headers | ||
.getSetCookie() | ||
.map((c) => c.split(';')[0]) | ||
.join('; '), | ||
data: headerResponse._data, | ||
}; | ||
} | ||
|
||
const response = await ofetch.raw(link, { | ||
headers: { | ||
Cookie: `sl-session=${session}; sl_waf_recap=${inspectResponse.jwt}`, | ||
}, | ||
}); | ||
|
||
const cookie = response.headers | ||
.getSetCookie() | ||
.map((c) => c.split(';')[0]) | ||
.join('; '); | ||
logger.debug(`getSafeLineCookie: ${cookie}`); | ||
|
||
cache.set(cacheKey, JSON.stringify(cookie), cacheAge); | ||
return { | ||
cookie, | ||
data: response._data, | ||
}; | ||
}; | ||
|
||
export const parseList = ($: cheerio.CheerioAPI) => { | ||
const winPageData = JSON.parse( | ||
$('script:contains("window.WinPageData")') | ||
.text() | ||
.match(/window\.WinPageData\s*=\s*({.*})/)?.[1] ?? '{}' | ||
); | ||
|
||
return winPageData.data.article.map((item) => ({ | ||
title: item.title, | ||
description: item.desc, | ||
link: 'https:' + item.url, | ||
author: item.author_name, | ||
pubDate: timezone(parseDate(item.date, 'MM月DD日'), +8), | ||
category: item.tag.map((t) => t.tag), | ||
image: item.thumbnail_mpic, | ||
})) as DataItem[]; | ||
}; | ||
|
||
export const fetchItem = async (item: DataItem, cookie: string) => { | ||
const response = await ofetch(item.link!, { | ||
headers: { | ||
Cookie: cookie as string, | ||
}, | ||
}); | ||
|
||
const $ = cheerio.load(response); | ||
|
||
const content = $('div.article_content div'); | ||
content.find('img').each((_, img) => { | ||
const $img = $(img); | ||
$img.attr('src', $img.attr('data-original')); | ||
$img.removeAttr('data-original'); | ||
}); | ||
|
||
item.description = content.html(); | ||
|
||
return item; | ||
}; |