Skip to main content

date-extractors

ai-research-agent / extractor/html-to-cite/extract-date/date-extractors

Functions

custom_parse()

function custom_parse(
string,
outputformat,
min_date,
max_date): null | string

Parameters

| Parameter | Type |
| --- | --- |
| string | any |
| outputformat | any |
| min_date | any |
| max_date | any |

Returns

null | string


discard_unwanted()

function discard_unwanted(tree): any[]

Parameters

| Parameter | Type |
| --- | --- |
| tree | any |

Returns

any[]


external_date_parser()

function external_date_parser(string, outputformat): null | string

Parameters

| Parameter | Type |
| --- | --- |
| string | any |
| outputformat | any |

Returns

null | string


extract_url_date()

function extract_url_date(testurl, options): null | string

Parameters

| Parameter | Type |
| --- | --- |
| testurl | any |
| options | any |

Returns

null | string


idiosyncrasies_search()

function idiosyncrasies_search(htmlstring, options): null | string

Parameters

| Parameter | Type |
| --- | --- |
| htmlstring | any |
| options | any |

Returns

null | string


img_search()

function img_search(tree, options): null | string

Parameters

| Parameter | Type |
| --- | --- |
| tree | any |
| options | any |

Returns

null | string


json_search()

function json_search(tree, options): any

Parameters

| Parameter | Type |
| --- | --- |
| tree | any |
| options | any |

Returns

any


pattern_search()

function pattern_search(
text,
date_pattern,
options): any

Parameters

| Parameter | Type |
| --- | --- |
| text | any |
| date_pattern | any |
| options | any |

Returns

any


regex_parse()

function regex_parse(string): null | Date

Parameters

| Parameter | Type |
| --- | --- |
| string | any |

Returns

null | Date


try_date_expr()

function try_date_expr(
string,
outputformat,
extensive_search,
min_date,
max_date): null | string

Parameters

| Parameter | Type |
| --- | --- |
| string | any |
| outputformat | any |
| extensive_search | any |
| min_date | any |
| max_date | any |

Returns

null | string

Variables

COPYRIGHT_PATTERN

const COPYRIGHT_PATTERN: RegExp;

DATE_EXPRESSIONS

const DATE_EXPRESSIONS: string;

DATESTRINGS_CATCH

const DATESTRINGS_CATCH: RegExp;

DATESTRINGS_PATTERN

const DATESTRINGS_PATTERN: RegExp;

FAST_PREPEND

const FAST_PREPEND: "" = '';

FREE_TEXT_EXPRESSIONS

const FREE_TEXT_EXPRESSIONS: ".//*[self::div or self::h2 or self::h3 or self::h4 or self::li or self::p or self::span or self::time or self::ul]/text()" = ".//*[self::div or self::h2 or self::h3 or self::h4 or self::li or self::p or self::span or self::time or self::ul]/text()";

MAX_SEGMENT_LEN

const MAX_SEGMENT_LEN: 52 = 52;

MIN_SEGMENT_LEN

const MIN_SEGMENT_LEN: 6 = 6;

MMYYYY_PATTERN

const MMYYYY_PATTERN: RegExp;

MMYYYY_YEAR

const MMYYYY_YEAR: RegExp;

SELECT_YMD_PATTERN

const SELECT_YMD_PATTERN: RegExp;

SELECT_YMD_YEAR

const SELECT_YMD_YEAR: RegExp;

SIMPLE_PATTERN

const SIMPLE_PATTERN: RegExp;

SLASHES_PATTERN

const SLASHES_PATTERN: RegExp;

SLASHES_YEAR

const SLASHES_YEAR: RegExp;

SLOW_PREPEND

const SLOW_PREPEND: "" = "";

THREE_CATCH

const THREE_CATCH: RegExp;

THREE_COMP_REGEX_A

const THREE_COMP_REGEX_A: RegExp;

THREE_COMP_REGEX_B

const THREE_COMP_REGEX_B: RegExp;

THREE_LOOSE_CATCH

const THREE_LOOSE_CATCH: RegExp;

THREE_LOOSE_PATTERN

const THREE_LOOSE_PATTERN: RegExp;

THREE_PATTERN

const THREE_PATTERN: RegExp;

TIMESTAMP_PATTERN

const TIMESTAMP_PATTERN: RegExp;

TWO_COMP_REGEX

const TWO_COMP_REGEX: RegExp;

YEAR_PATTERN

const YEAR_PATTERN: RegExp;

YMD_PATTERN

const YMD_PATTERN: RegExp;

YMD_YEAR

const YMD_YEAR: RegExp;

YYYYMM_CATCH

const YYYYMM_CATCH: RegExp;

YYYYMM_PATTERN

const YYYYMM_PATTERN: RegExp;