Functions / Extractor / Html to cite / Extract date

Date Extractors

ai-research-agent / extractor/html-to-cite/extract-date/date-extractors

COPYRIGHT_PATTERN

const COPYRIGHT_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:89


DATE_EXPRESSIONS

const DATE_EXPRESSIONS: string;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:40


DATESTRINGS_CATCH

const DATESTRINGS_CATCH: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:98


DATESTRINGS_PATTERN

const DATESTRINGS_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:97


FAST_PREPEND

const FAST_PREPEND: "" = '';

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:30


FREE_TEXT_EXPRESSIONS

const FREE_TEXT_EXPRESSIONS: ".//*[self::div or self::h2 or self::h3 or self::h4 or self::li or self::p or self::span or self::time or self::ul]/text()" = ".//*[self::div or self::h2 or self::h3 or self::h4 or self::li or self::p or self::span or self::time or self::ul]/text()";

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:80


MAX_SEGMENT_LEN

const MAX_SEGMENT_LEN: 52 = 52;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:34


MIN_SEGMENT_LEN

const MIN_SEGMENT_LEN: 6 = 6;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:33


MMYYYY_PATTERN

const MMYYYY_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:103


MMYYYY_YEAR

const MMYYYY_YEAR: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:104


SELECT_YMD_PATTERN

const SELECT_YMD_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:94


SELECT_YMD_YEAR

const SELECT_YMD_YEAR: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:95


SIMPLE_PATTERN

const SIMPLE_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:105


SLASHES_PATTERN

const SLASHES_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:99


SLASHES_YEAR

const SLASHES_YEAR: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:100


SLOW_PREPEND

const SLOW_PREPEND: "" = "";

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:74


THREE_CATCH

const THREE_CATCH: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:91


THREE_COMP_REGEX_A

const THREE_COMP_REGEX_A: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:83


THREE_COMP_REGEX_B

const THREE_COMP_REGEX_B: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:84


THREE_LOOSE_CATCH

const THREE_LOOSE_CATCH: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:93


THREE_LOOSE_PATTERN

const THREE_LOOSE_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:92


THREE_PATTERN

const THREE_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:90


TIMESTAMP_PATTERN

const TIMESTAMP_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:140


TWO_COMP_REGEX

const TWO_COMP_REGEX: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:85


YEAR_PATTERN

const YEAR_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:88


YMD_PATTERN

const YMD_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:109


YMD_YEAR

const YMD_YEAR: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:96


YYYYMM_CATCH

const YYYYMM_CATCH: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:102


YYYYMM_PATTERN

const YYYYMM_PATTERN: RegExp;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:101


custom_parse()

function custom_parse(
   string: any, 
   outputformat: any, 
   min_date: any, 
   max_date: any): string;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:247

Parameters

Parameter | Type

string

any

outputformat

any

min_date

any

max_date

any

Returns

string


discard_unwanted()

function discard_unwanted(tree: any): any[];

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:186

Parameters

Parameter | Type

tree

any

Returns

any[]


external_date_parser()

function external_date_parser(string: any, outputformat: any): string;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:342

Parameters

Parameter | Type

string

any

outputformat

any

Returns

string


extract_url_date()

function extract_url_date(testurl: any, options: any): string;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:196

Parameters

Parameter | Type

testurl

any

options

any

Returns

string


idiosyncrasies_search()

function idiosyncrasies_search(htmlstring: any, options: any): string;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:416

Parameters

Parameter | Type

htmlstring

any

options

any

Returns

string


img_search()

function img_search(tree: any, options: any): string;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:386

Parameters

Parameter | Type

tree

any

options

any

Returns

string


json_search()

function json_search(tree: any, options: any): any;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:403

Parameters

Parameter | Type

tree

any

options

any

Returns

any


pattern_search()

function pattern_search(
   text: any, 
   date_pattern: any, 
   options: any): any;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:394

Parameters

Parameter | Type

text

any

date_pattern

any

options

any

Returns

any


regex_parse()

function regex_parse(string: any): Date;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:225

Parameters

Parameter | Type

string

any

Returns

Date


try_date_expr()

function try_date_expr(
   string: any, 
   outputformat: any, 
   extensive_search: any, 
   min_date: any, 
   max_date: any): string;

Defined in: src/extractor/html-to-cite/extract-date/date-extractors.js:356

Parameters

Parameter | Type

string

any

outputformat

any

extensive_search

any

min_date

any

max_date

any

Returns

string