mirror of
https://github.com/catdevnull/preciazo.git
synced 2024-11-26 03:26:19 +00:00
ignorar paginas status!=200
This commit is contained in:
parent
7b989f0ea0
commit
405502877c
1 changed file with 6 additions and 0 deletions
|
@@ -52,6 +52,12 @@ export async function parseWarc(path: string) {
|
||||||
console.debug(`skipped ${warcRecordId}`);
|
console.debug(`skipped ${warcRecordId}`);
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
|
if (record.httpHeaders?.statusCode !== 200) {
|
||||||
|
console.debug(
|
||||||
|
`skipped ${warcRecordId} because status=${record.httpHeaders?.statusCode} (!=200)`
|
||||||
|
);
|
||||||
|
continue;
|
||||||
|
}
|
||||||
// TODO: sobreescribir si existe el mismo record-id pero con version mas bajo?
|
// TODO: sobreescribir si existe el mismo record-id pero con version mas bajo?
|
||||||
|
|
||||||
const html = await record.contentText();
|
const html = await record.contentText();
|
||||||
|
|
Loading…
Reference in a new issue