mirror of
https://git.luna-app.eu/50n50/sources
synced 2025-12-21 21:26:19 +01:00
232 lines
7.4 KiB
JavaScript
232 lines
7.4 KiB
JavaScript
/**
 * Searches helioscans.com for series matching a keyword.
 *
 * Fetches the series search page through `soraFetch` and scrapes every result
 * card with a regular expression: a `<button title="...">` followed by an
 * `<a href="...">` and a CSS `background-image:url(...)` cover.
 *
 * @param {string} keyword - Search term; URL-encoded before being sent.
 * @returns {Promise<string>} JSON string of `[{ title, href, image }]`. If
 *   fetching or parsing throws, a single placeholder entry titled "Error" is
 *   returned instead of rejecting.
 */
async function searchResults(keyword) {
    const siteOrigin = "https://helioscans.com";

    // Turns a scraped URL into an absolute one: absolute URLs pass through,
    // protocol-relative URLs get "https:", everything else is site-relative.
    const resolveUrl = (raw) => {
        if (/^https?:\/\//i.test(raw)) return raw;
        if (raw.startsWith("//")) return `https:${raw}`;
        return `${siteOrigin}${raw.startsWith("/") ? "" : "/"}${raw}`;
    };

    try {
        const encodedKeyword = encodeURIComponent(keyword);
        const response = await soraFetch(`${siteOrigin}/series/?q=${encodedKeyword}`);
        const html = await response.text();

        const cardRegex = /<button[^>]+?title="([^"]+?)"[^>]*?>[\s\S]*?<a href="([^"]+?)"[\s\S]*?background-image:url\(([^)]+)\)/g;
        const results = [];
        let match;

        while ((match = cardRegex.exec(html)) !== null) {
            // The URL sits inside an HTML attribute, so "&" arrives escaped,
            // and CSS allows the url(...) argument to be quoted.
            const rawImage = match[3]
                .replace(/&amp;/g, "&")
                .trim()
                .replace(/^["']|["']$/g, "");

            results.push({
                title: match[1],
                href: resolveUrl(match[2]),
                image: resolveUrl(rawImage)
            });
        }

        console.log(JSON.stringify(results));
        return JSON.stringify(results);
    } catch (error) {
        console.error("Error fetching or parsing: " + error);
        return JSON.stringify([{
            title: "Error",
            href: "",
            image: ""
        }]);
    }
}
|
||
// NOTE(review): this runs at module load and calls extractChapters with a
// hard-coded series URL; the returned promise is neither awaited nor used.
// Looks like a leftover debugging call — confirm before removing.
extractChapters('https://helioscans.com/series/63a6054296b/');
|
||
|
||
/**
 * Loads a series page and extracts its description.
 *
 * The description is read from the page's `<meta name="description">` tag with
 * runs of whitespace collapsed to single spaces. `aliases` and `airdate` are
 * always reported as 'N/A'; this function does not scrape them.
 *
 * @param {string} url - Series page URL, passed unchanged to `soraFetch`.
 * @returns {Promise<string>} JSON string of a one-element array
 *   `[{ description, aliases, airdate }]`. If fetching or parsing throws, the
 *   description is 'Error loading description' instead of rejecting.
 */
async function extractDetails(url) {
    try {
        const response = await soraFetch(url);
        const htmlText = await response.text();

        // Stop at the closing quote of `content` rather than requiring `">`,
        // so self-closing tags (`... />`) and trailing attributes still match.
        const metaMatch = htmlText.match(/<meta\s+name=["']description["']\s+content="([^"]*)"/i);
        const description = metaMatch
            ? metaMatch[1].replace(/\s+/g, ' ').trim()
            : "No description available";

        const transformedResults = [{
            description,
            aliases: 'N/A',
            airdate: 'N/A'
        }];

        console.log(JSON.stringify(transformedResults));
        return JSON.stringify(transformedResults);
    } catch (error) {
        console.error('Details error:' + error);
        return JSON.stringify([{
            description: 'Error loading description',
            aliases: 'N/A',
            airdate: 'N/A'
        }]);
    }
}
|
||
|
||
/**
 * Loads a series page and lists its chapters in ascending order.
 *
 * Every `<a>` whose href contains `/chapter/` is treated as a chapter link.
 * Its title comes from the inner `<span>` carrying both the `text-sm` and
 * `truncate` classes; links without such a title are skipped. Links whose
 * markup references `Coin.svg` are labelled as locked.
 *
 * Chapters are sorted by the number following the word "Chapter" in the title
 * (decimals such as "Chapter 10.5" included; titles without a number sort as
 * 0) and then numbered sequentially from 1.
 *
 * @param {string} url - Series page URL, passed unchanged to `soraFetch`.
 * @returns {Promise<string>} JSON string of `[{ title, href, number }]`. If
 *   fetching or parsing throws, a single placeholder entry with `number: 0`
 *   and `href` set to `url` is returned instead of rejecting.
 */
async function extractChapters(url) {
    const siteOrigin = "https://helioscans.com";
    const titleRegex = /<span[^>]*class="[^"]*\btext-sm\b[^"]*\btruncate\b[^"]*"[^>]*>([^<]+)<\/span>/i;

    // Numeric sort key; keeps the fractional part so 10.5 sorts after 10.
    const chapterNumberOf = (title) => {
        const found = title.match(/Chapter\s+(\d+(?:\.\d+)?)/i);
        return found ? Number.parseFloat(found[1]) : 0;
    };

    // Absolute links pass through; site-relative links get the origin.
    const resolveUrl = (raw) => {
        if (/^https?:\/\//i.test(raw)) return raw;
        return `${siteOrigin}${raw.startsWith("/") ? "" : "/"}${raw}`;
    };

    try {
        const response = await soraFetch(url);
        const htmlText = await response.text();

        const chapters = [];
        // Created per call: a /g regex keeps `lastIndex` state between exec() calls.
        const chapterLinkRegex = /<a\s+[^>]*href="([^"]*\/chapter\/[^"]*)"[^>]*>([\s\S]*?)<\/a>/gi;
        let linkMatch;

        while ((linkMatch = chapterLinkRegex.exec(htmlText)) !== null) {
            const fullLinkHtml = linkMatch[0];
            const titleMatch = titleRegex.exec(fullLinkHtml);
            const rawTitle = titleMatch ? titleMatch[1].trim() : "";

            if (!rawTitle) continue;

            const isLocked = /Coin\.svg/i.test(fullLinkHtml);
            chapters.push({
                title: isLocked ? `${rawTitle} (Locked – 100 credits)` : rawTitle,
                href: resolveUrl(linkMatch[1])
            });
        }

        chapters.sort((a, b) => chapterNumberOf(a.title) - chapterNumberOf(b.title));

        // `number` is the position in the sorted list, not the parsed chapter number.
        chapters.forEach((chapter, index) => {
            chapter.number = index + 1;
        });

        console.log(JSON.stringify(chapters));
        return JSON.stringify(chapters);
    } catch (error) {
        console.error('Fetch error in extractChapters:', error);
        return JSON.stringify([{
            href: url,
            title: "Error fetching chapters",
            number: 0
        }]);
    }
}
|
||
|
||
/**
 * Loads a chapter page and returns the HTML inside its `<div id="pages">`.
 *
 * The closing tag of the pages container is located by counting nested
 * `<div` / `</div` occurrences. `<script>` elements and the full-screen
 * overlay div (matched by its utility-class list) are stripped from the
 * result, which is then trimmed.
 *
 * @param {string} url - Chapter page URL.
 * @returns {Promise<string>} The cleaned inner HTML of the pages container.
 *   On ANY failure (fetch error, container not found, empty content) a fixed
 *   `<p>Error: ...</p>` message describing the chapter as locked is returned
 *   instead of rejecting.
 */
async function extractText(url) {
    try {
        const headers = {
            'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.3029.110 Safari/537.36',
            'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
            'Accept-Language': 'en-US,en;q=0.5',
            'Connection': 'keep-alive',
            'Upgrade-Insecure-Requests': '1'
        };

        // soraFetch reads `options.headers`, so the header map must be wrapped
        // in an options object; passing it bare drops every header.
        const response = await soraFetch(url, { headers });
        const htmlText = await response.text();

        const startMarker = '<div id="pages"';
        const startIndex = htmlText.indexOf(startMarker);
        if (startIndex === -1) {
            throw new Error("Pages content div start (<div id=\"pages\") not found");
        }

        const startTagEndIndex = htmlText.indexOf('>', startIndex);
        if (startTagEndIndex === -1) {
            throw new Error("Could not find the end of the opening <div id=\"pages\"> tag");
        }

        // Walk forward tracking div nesting depth until the container's own
        // closing tag is reached (depth drops back to 0).
        const contentStartIndex = startTagEndIndex + 1;
        let depth = 1;
        let pos = contentStartIndex;
        let endIndex = -1;

        while (depth > 0 && pos < htmlText.length) {
            const nextOpenDiv = htmlText.indexOf('<div', pos);
            const nextCloseDiv = htmlText.indexOf('</div', pos);

            if (nextCloseDiv === -1) {
                break;
            }

            if (nextOpenDiv !== -1 && nextOpenDiv < nextCloseDiv) {
                depth++;
                pos = nextOpenDiv + 4; // skip past '<div'
            } else {
                depth--;
                if (depth === 0) {
                    endIndex = nextCloseDiv;
                } else {
                    pos = nextCloseDiv + 5; // skip past '</div'
                }
            }
        }

        if (endIndex === -1) {
            throw new Error("Matching closing </div> for pages content div not found");
        }

        const innerContent = htmlText
            .substring(contentStartIndex, endIndex)
            .replace(/<script\b[^<]*(?:(?!<\/script>)<[^<]*)*<\/script>/gi, '')
            .replace(/<div[^>]*class="[^"]*fixed[^"]*z-\[60\][^"]*top-0[^"]*left-0[^"]*w-full[^"]*h-full[^"]*bg-black\/90[^"]*flex[^"]*justify-center[^"]*items-center[\s\S]*?<\/div>/gi, '')
            .trim();

        if (!innerContent) {
            throw new Error("Chapter text not found or empty after cleaning");
        }

        console.log(innerContent);
        return innerContent;
    } catch (error) {
        console.error("Fetch error in extractText: " + error.message);
        return '<p>Error: This is chapter is locked as early access by the website, you will have to pay on the website or wait for the chapter to be released globally</p>';
    }
}
|
||
|
||
/**
 * Fetch wrapper that prefers `fetchv2` and falls back to the standard `fetch`.
 *
 * `fetchv2` is not defined in this file — presumably it is injected by the
 * host app; verify against the runtime. It is called positionally as
 * `fetchv2(url, headers, method, body)`. If that call throws for any reason
 * (including `fetchv2` not existing), `fetch(url, options)` is tried instead.
 *
 * @param {string} url - Request URL.
 * @param {{headers?: Object, method?: string, body?: *}} [options] - Request
 *   options. Missing or nullish fields default to `{}`, `'GET'` and `null`;
 *   a nullish `options` is treated as an empty object.
 * @returns {Promise<*>} Whatever the successful transport returns, or `null`
 *   when both transports fail (the failure is logged, never thrown).
 */
async function soraFetch(url, options = {
    headers: {},
    method: 'GET',
    body: null
}) {
    // Normalise first so an explicit `null` cannot throw before fetchv2 runs.
    const requestOptions = options ?? {};

    try {
        return await fetchv2(
            url,
            requestOptions.headers ?? {},
            requestOptions.method ?? 'GET',
            requestOptions.body ?? null
        );
    } catch (primaryError) {
        try {
            return await fetch(url, requestOptions);
        } catch (fallbackError) {
            // Best-effort contract: report the failure but keep returning null.
            console.error(`soraFetch failed for ${url}: fetchv2: ${primaryError}; fetch: ${fallbackError}`);
            return null;
        }
    }
}
|
||
|
||
/**
 * Replaces HTML character references in a string with the characters they
 * stand for.
 *
 * Handles the named references listed in the table below and any numeric
 * reference, hexadecimal (`&#x27;`) or decimal (`&#39;`). Unknown names and
 * numeric values above U+10FFFF are left in the text untouched.
 *
 * @param {string} text - Text that may contain HTML character references.
 * @returns {string} The decoded text; an empty string for `null`/`undefined`.
 */
function decodeHtmlEntities(text) {
    if (text == null) return '';

    // Keyed by bare name (no "&" / ";"). A Map is used so names that collide
    // with Object.prototype members (e.g. "constructor") cannot match.
    const namedEntities = new Map([
        ['mdash', '—'],
        ['ndash', '–'],
        ['amp', '&'],
        ['lt', '<'],
        ['gt', '>'],
        ['quot', '"'],
        ['apos', "'"],
        ['nbsp', ' ']
    ]);

    return String(text).replace(/&#[xX][\dA-Fa-f]+;|&#\d+;|&\w+;/g, (entity) => {
        if (entity[1] !== '#') {
            return namedEntities.get(entity.slice(1, -1)) ?? entity;
        }

        const isHex = entity[2] === 'x' || entity[2] === 'X';
        const codePoint = isHex
            ? Number.parseInt(entity.slice(3, -1), 16)
            : Number.parseInt(entity.slice(2, -1), 10);

        // String.fromCodePoint throws a RangeError above U+10FFFF.
        return codePoint <= 0x10FFFF ? String.fromCodePoint(codePoint) : entity;
    });
}
|