What do you want to automate with LlamaIndex and FireCrawl?
Crawls a given URL and returns the contents of sub-pages. See the documentation.
Extracts structured data from one or multiple URLs. See the documentation.
Obtains the status and data from a previous crawl operation. See the documentation.
Obtains the status and data from a previous extract operation. See the documentation.
Scrapes a URL and returns content from that page. See the documentation.
import { axios } from "@pipedream/platform";
import FormData from "form-data";
import request from "request";
/**
 * Pipedream component that uploads a sample PDF file to the
 * `/api/parsing/upload` endpoint of the connected LlamaIndex account.
 *
 * Uses `axios` (from "@pipedream/platform"), `FormData` (from "form-data")
 * and `request`, all imported at the top of the file.
 */
export default defineComponent({
  props: {
    // Connected LlamaIndex account; `$auth.url` and `$auth.api_key` are read in `run`.
    llamaindex: {
      type: "app",
      app: "llamaindex",
    },
  },
  /**
   * Builds a multipart form containing the sample PDF and POSTs it.
   *
   * @param {object} context - Pipedream run context.
   * @param {object} context.steps - Previous step exports (unused here).
   * @param {object} context.$ - Pipedream step object passed through to `axios`.
   * @returns {Promise<*>} Whatever the `axios` call resolves to.
   */
  async run({ steps, $ }) {
    const data = new FormData();
    // The PDF is streamed from its public URL into the "file" form field.
    data.append(
      "file",
      request("https://www.learningcontainer.com/wp-content/uploads/2019/09/sample-pdf-file.pdf"),
    );

    return await axios($, {
      method: "POST",
      url: `${this.llamaindex.$auth.url}/api/parsing/upload`,
      headers: {
        // A bare "multipart/form-data" Content-Type has no boundary, so the
        // receiver cannot split the body into parts. form-data's getHeaders()
        // returns the Content-Type including the generated boundary.
        ...data.getHeaders(),
        Authorization: `Bearer ${this.llamaindex.$auth.api_key}`,
      },
      data,
    });
  },
});
import { axios } from "@pipedream/platform"
/**
 * Pipedream component that POSTs a fixed URL (https://pipedream.com) to the
 * FireCrawl `/v0/crawl` endpoint using the connected account's API key.
 */
export default defineComponent({
  props: {
    // Connected FireCrawl account; `$auth.api_key` is read in `run`.
    firecrawl: { type: "app", app: "firecrawl" },
  },
  /**
   * Sends the crawl request and returns whatever the `axios` call resolves to.
   *
   * @param {object} context - Pipedream run context.
   * @param {object} context.steps - Previous step exports (unused here).
   * @param {object} context.$ - Pipedream step object passed through to `axios`.
   */
  async run({ steps, $ }) {
    const payload = { "url": "https://pipedream.com" };
    const token = this.firecrawl.$auth.api_key;

    const requestConfig = {
      method: "post",
      url: `https://api.firecrawl.dev/v0/crawl`,
      headers: { Authorization: `Bearer ${token}` },
      data: payload,
    };

    return await axios($, requestConfig);
  },
});