feat: Add @mozilla/readability dependency for extracting content from web pages

This commit is contained in:
n4ze3m
2024-06-22 00:25:12 +05:30
parent 56cea30058
commit d23b70b979
7 changed files with 136 additions and 3 deletions

View File

@@ -4,6 +4,7 @@ import { webDuckDuckGoSearch } from "./search-engines/duckduckgo"
import { getSearchProvider } from "@/services/search"
import { webSogouSearch } from "./search-engines/sogou"
import { webBraveSearch } from "./search-engines/brave"
import { getWebsiteFromQuery, processSingleWebsite } from "./website"
const getHostName = (url: string) => {
try {
@@ -29,8 +30,25 @@ const searchWeb = (provider: string, query: string) => {
export const getSystemPromptForWeb = async (query: string) => {
try {
const searchProvider = await getSearchProvider()
const search = await searchWeb(searchProvider, query)
const websiteVisit = getWebsiteFromQuery(query)
let search: {
url: any;
content: string;
}[] = []
if (websiteVisit.hasUrl) {
const url = websiteVisit.url
const queryWithoutUrl = websiteVisit.queryWithouUrls
search = await processSingleWebsite(url, queryWithoutUrl)
} else {
const searchProvider = await getSearchProvider()
search = await searchWeb(searchProvider, query)
}
const search_results = search
.map(