date-extractors
ai-research-agent / extractor/html-to-cite/extract-date/date-extractors
Functions
custom_parse()
function custom_parse(
string,
outputformat,
min_date,
max_date): null | string
Parameters
| Parameter | Type |
|---|---|
| `string` | |
| `outputformat` | |
| `min_date` | |
| `max_date` | |
Returns
`null | string`
discard_unwanted()
function discard_unwanted(tree): any[]
Parameters
| Parameter | Type |
|---|---|
| `tree` | |
Returns
`any[]`
external_date_parser()
function external_date_parser(string, outputformat): null | string
Parameters
| Parameter | Type |
|---|---|
| `string` | |
| `outputformat` | |
Returns
`null | string`
extract_url_date()
function extract_url_date(testurl, options): null | string
Parameters
| Parameter | Type |
|---|---|
| `testurl` | |
| `options` | |
Returns
`null | string`
idiosyncrasies_search()
function idiosyncrasies_search(htmlstring, options): null | string
Parameters
| Parameter | Type |
|---|---|
| `htmlstring` | |
| `options` | |
Returns
`null | string`
img_search()
function img_search(tree, options): null | string
Parameters
| Parameter | Type |
|---|---|
| `tree` | |
| `options` | |
Returns
`null | string`
json_search()
function json_search(tree, options): any
Parameters
| Parameter | Type |
|---|---|
| `tree` | |
| `options` | |
Returns
any
pattern_search()
function pattern_search(
text,
date_pattern,
options): any
Parameters
| Parameter | Type |
|---|---|
| `text` | |
| `date_pattern` | |
| `options` | |
Returns
any
regex_parse()
function regex_parse(string): null | Date
Parameters
| Parameter | Type |
|---|---|
| `string` | |
Returns
`null | Date`
try_date_expr()
function try_date_expr(
string,
outputformat,
extensive_search,
min_date,
max_date): null | string
Parameters
| Parameter | Type |
|---|---|
| `string` | |
| `outputformat` | |
| `extensive_search` | |
| `min_date` | |
| `max_date` | |
Returns
`null | string`
Variables
COPYRIGHT_PATTERN
const COPYRIGHT_PATTERN: RegExp;
DATE_EXPRESSIONS
const DATE_EXPRESSIONS: string;
DATESTRINGS_CATCH
const DATESTRINGS_CATCH: RegExp;
DATESTRINGS_PATTERN
const DATESTRINGS_PATTERN: RegExp;
FAST_PREPEND
const FAST_PREPEND: "" = '';
FREE_TEXT_EXPRESSIONS
const FREE_TEXT_EXPRESSIONS: ".//*[self::div or self::h2 or self::h3 or self::h4 or self::li or self::p or self::span or self::time or self::ul]/text()" = ".//*[self::div or self::h2 or self::h3 or self::h4 or self::li or self::p or self::span or self::time or self::ul]/text()";
MAX_SEGMENT_LEN
const MAX_SEGMENT_LEN: 52 = 52;
MIN_SEGMENT_LEN
const MIN_SEGMENT_LEN: 6 = 6;
MMYYYY_PATTERN
const MMYYYY_PATTERN: RegExp;
MMYYYY_YEAR
const MMYYYY_YEAR: RegExp;
SELECT_YMD_PATTERN
const SELECT_YMD_PATTERN: RegExp;
SELECT_YMD_YEAR
const SELECT_YMD_YEAR: RegExp;
SIMPLE_PATTERN
const SIMPLE_PATTERN: RegExp;
SLASHES_PATTERN
const SLASHES_PATTERN: RegExp;
SLASHES_YEAR
const SLASHES_YEAR: RegExp;
SLOW_PREPEND
const SLOW_PREPEND: "" = "";
THREE_CATCH
const THREE_CATCH: RegExp;
THREE_COMP_REGEX_A
const THREE_COMP_REGEX_A: RegExp;
THREE_COMP_REGEX_B
const THREE_COMP_REGEX_B: RegExp;
THREE_LOOSE_CATCH
const THREE_LOOSE_CATCH: RegExp;
THREE_LOOSE_PATTERN
const THREE_LOOSE_PATTERN: RegExp;
THREE_PATTERN
const THREE_PATTERN: RegExp;
TIMESTAMP_PATTERN
const TIMESTAMP_PATTERN: RegExp;
TWO_COMP_REGEX
const TWO_COMP_REGEX: RegExp;
YEAR_PATTERN
const YEAR_PATTERN: RegExp;
YMD_PATTERN
const YMD_PATTERN: RegExp;
YMD_YEAR
const YMD_YEAR: RegExp;
YYYYMM_CATCH
const YYYYMM_CATCH: RegExp;
YYYYMM_PATTERN
const YYYYMM_PATTERN: RegExp;