-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Cont. work on processScans, handling diff. statuses, matching result IDs
- Loading branch information
1 parent
cd5398f
commit b815ced
Showing
1 changed file
with
80 additions
and
4 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,14 +1,90 @@ | ||
import { jwtClaims } from 'app'; | ||
import { pgClient } from 'utils'; | ||
|
||
export const processScans = async () => { | ||
// This route is called once every minute by Amazon EventBridge Scheduler | ||
await pgClient.connect(); | ||
const scans = (await pgClient.query(`SELECT "id", "job_id" FROM "scans" WHERE "processing"=TRUE ORDER BY "created_at" DESC`)).rows; | ||
const scans = (await pgClient.query(`SELECT "id", "job_id", "property_id" FROM "scans" WHERE "processing"=TRUE ORDER BY "created_at" DESC`)).rows; | ||
for (const scan of scans) { | ||
const response = await (await fetch(`https://scan.equalify.app/results/${scan.job_id}`)).json(); | ||
if (response?.status === 'completed') { | ||
await pgClient.query(`UPDATE "scans" SET "processing"=FALSE, "results"=$1`, [response?.result]); | ||
try { | ||
const { result, status } = await (await fetch(`https://scan.equalify.app/results/${scan.job_id}`)).json(); | ||
if (['delayed', 'active', 'waiting'].includes(status)) { | ||
console.log(`Scan ${scan.id} is ${status}- scan skipped.`); | ||
} | ||
else if (['failed', 'unknown'].includes(status)) { | ||
await pgClient.query(`DELETE FROM "scans" WHERE "id"=$1`, [scan.id]); | ||
console.log(`Scan ${scan.id} is ${status}- scan deleted.`); | ||
} | ||
else if (['completed'].includes(status)) { | ||
await scanProcessor({ result, scan }); | ||
console.log(`Scan ${scan.id} is ${status}- scan complete!`); | ||
} | ||
} | ||
catch (err) { | ||
console.log(`Scan ${scan.id} ran into an error: ${err.message}`); | ||
} | ||
} | ||
await pgClient.clean(); | ||
return; | ||
} | ||
|
||
const scanProcessor = async ({ result, scan }) => { | ||
// 1. Set processing to FALSE to prevent API from accidentally re-processing the same scan | ||
await pgClient.query(`UPDATE "scans" SET "processing"=FALSE, "results"=$1`, [result]); | ||
|
||
// 2. Find existing IDs for urls, messages, tags, & nodes (or create them) | ||
for (const row of result.urls) { | ||
row.id = | ||
(await pgClient.query({ | ||
text: `SELECT "id" FROM "urls" WHERE "user_id"=$1 AND "url"=$2 AND "property_id"=$3`, | ||
values: [jwtClaims.sub, row.url, scan.property_id], | ||
})).rows?.[0]?.id | ||
?? | ||
(await pgClient.query({ | ||
text: `INSERT INTO "urls" ("user_id", "url", "property_id") VALUES ($1, $2, $3) RETURNING "id"`, | ||
values: [jwtClaims.sub, row.url, scan.property_id] | ||
})).rows?.[0]?.id; | ||
} | ||
for (const row of result.messages) { | ||
row.id = | ||
(await pgClient.query({ | ||
text: `SELECT "id" FROM "messages" WHERE "user_id"=$1 AND "message"=$2 AND "type"=$3`, | ||
values: [jwtClaims.sub, row.message, row.type], | ||
})).rows?.[0]?.id | ||
?? | ||
(await pgClient.query({ | ||
text: `INSERT INTO "messages" ("user_id", "message", "type") VALUES ($1, $2, $3) RETURNING "id"`, | ||
values: [jwtClaims.sub, row.message, row.type], | ||
})).rows?.[0]?.id; | ||
} | ||
for (const row of result.tags) { | ||
row.id = | ||
(await pgClient.query({ | ||
text: `SELECT "id" FROM "tags" WHERE "user_id"=$1 AND "tag"=$2`, | ||
values: [jwtClaims.sub, row.tag], | ||
})).rows?.[0]?.id | ||
?? | ||
(await pgClient.query({ | ||
text: `INSERT INTO "tags" ("user_id", "tag") VALUES ($1, $2) RETURNING "id"`, | ||
values: [jwtClaims.sub, row.tag], | ||
})).rows?.[0]?.id; | ||
} | ||
for (const row of result.nodes) { | ||
row.id = | ||
(await pgClient.query({ | ||
text: `SELECT "id" FROM "nodes" WHERE "user_id"=$1 AND "html"=$2 AND "targets"=$3 AND "url_id"=$4`, | ||
values: [jwtClaims.sub, row.html, row.targets, row.url_id], | ||
})).rows?.[0]?.id | ||
?? | ||
(await pgClient.query({ | ||
text: `INSERT INTO "nodes" ("user_id", "html", "targets", "url_id") VALUES ($1, $2, $3, $4) RETURNING "id"`, | ||
values: [jwtClaims.sub, row.html, row.targets, row.url_id], | ||
})).rows?.[0]?.id; | ||
} | ||
|
||
// 3. Compare & update nodes | ||
|
||
// 4. Delete the scan and move on! | ||
await pgClient.query(`DELETE FROM "scans" WHERE "id"=$1`, [scan.id]); | ||
return; | ||
} |