You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
65 lines
1.9 KiB
65 lines
1.9 KiB
import db from "../db/index" |
|
import Elastic from "./modules/elastic" |
|
import Parser from "./modules/parser" |
|
import { SHOULD_NOT_PARSE } from "./modules/parser/helpers" |
|
import { Domain } from "domain" |
|
|
|
/** Maps a sub-page path to whether that path has already been visited by the crawler. */
type SubPages = Record<string, boolean>

/**
 * Returns the first path in `subpages` whose flag is falsy, in
 * `Object.entries` enumeration order.
 *
 * @param subpages Path-to-visited map; defaults to an empty map.
 * @returns The first not-yet-visited path, or `undefined` when every path is
 *   flagged as visited (or the map is empty).
 */
const findFirstNotIndexed = (subpages: SubPages = {}): string | undefined => {
  for (const [path, isIndexed] of Object.entries(subpages)) {
    if (!isIndexed) {
      return path
    }
  }
  return undefined
}
|
|
|
/**
 * Once this many paths are known, visited pages are still parsed and marked as
 * visited, but they are no longer sent to Elastic and their links are no
 * longer added to the crawl queue.
 */
const MAX_KNOWN_SUBPAGES = 50

/**
 * Crawls a website starting at `path`, one page at a time, until no known
 * path is left unvisited.
 *
 * For each unvisited path the page at `domain + path` is parsed and the path
 * is flagged as visited. Unless the parser returned `SHOULD_NOT_PARSE` or the
 * known-path limit was already reached, the page's `elasticData` is indexed
 * and its `subPages` are merged into the queue (flags already present in the
 * queue take precedence over the parser's).
 *
 * The crawl is a loop rather than one nested async call per page, so the
 * number of pending calls does not grow with the number of pages.
 *
 * @param domain Base URL that each path is appended to.
 * @param path Path to visit first.
 * @param subpages Known paths and their visited flags. The object passed in
 *   is mutated: visited paths are set to `true` on it until the first merge
 *   replaces the working map with a copy.
 * @param count Retained for backward compatibility with existing callers;
 *   it does not influence the crawl.
 * @returns A promise that resolves once every known path has been visited.
 */
const indexWebsite = async (
  domain: string,
  path: string,
  subpages: SubPages = {},
  count = 0,
): Promise<void> => {
  let pages: SubPages = subpages
  let current: string | undefined = path

  // Compare against undefined instead of truthiness so that an empty-string
  // path does not end the crawl while other paths are still unvisited.
  while (current !== undefined) {
    console.log(pages)

    // Measured before the current path is flagged, matching the point at
    // which the limit has always been evaluated.
    const knownBeforeVisit = Object.keys(pages).length

    if (!pages[current]) {
      const parseInfo = await Parser.parseUrl(domain + current)
      console.log(parseInfo)

      pages[current] = true

      if (parseInfo !== SHOULD_NOT_PARSE && knownBeforeVisit < MAX_KNOWN_SUBPAGES) {
        await Elastic.index(parseInfo.elasticData)
        // Existing flags are spread last so an already visited path is never
        // reset by the links discovered on this page.
        pages = { ...parseInfo.subPages, ...pages }
      }
    }

    current = findFirstNotIndexed(pages)
  }
}
|
|
|
|
|
/**
 * Entry point: initialises Elastic, loads every domain record flagged as
 * available, and crawls each one starting from its root path.
 *
 * A record's `lastParse` timestamp is written before its crawl starts, so it
 * records when the crawl was attempted, not when it finished.
 *
 * NOTE(review): `domain.address` is passed to `indexWebsite` as the base URL
 * exactly as stored — confirm that it already includes the scheme.
 *
 * @returns A promise that resolves after all domains have been processed.
 */
const main = async (): Promise<void> => {
  await Elastic.initElastic()

  const domains = await db.nftDomain.findMany({ where: { available: true } })
  console.log('Find domains', domains)

  // Domains are processed one after another; a nullish result is treated as
  // "nothing to do", as the previous `if (domains)` guard did.
  for (const domain of domains ?? []) {
    await db.nftDomain.update({
      where: { address: domain.address },
      data: { lastParse: new Date() },
    })

    console.log('Start index domain: ', domain.address)
    await indexWebsite(domain.address, "/")
  }

  console.log('Finish parse domains')
}
|
|
|
|
|
export default main
|
|
|