acorn_lib/
constants.rs

1//! # Constants, regular expressions, and configuration values
2//!
3//! This module contains a collection of regular expressions, configuration values, and guidelines for research activity data. This includes section character counts and line counts.
4//!
5use fancy_regex::Regex;
6use lazy_static::lazy_static;
7
8/// ORNL disclaimer
9pub const DISCLAIMER: &str = "Oak Ridge National Laboratory is managed by UT-Batelle LLC for the US Department of Energy";
10/// Base URL for deploying ORNL data
11pub const BASE_URL: &str = "https://research.ornl.gov";
12/// RGB color for transparency
13pub const COLOR_TRANSPARENT: [u8; 4] = [255, 255, 255, 0];
14/// RGB ORNL brand primary color
15///
16// See <https://www.olcf.ornl.gov/about-olcf/media-assets/>
17pub const COLOR_PRIMARY: [u8; 4] = [0, 121, 52, 255];
18/// URL for Vale releases
19pub const VALE_RELEASES_URL: &str = "https://github.com/errata-ai/vale/releases";
20/// Version of Vale to use with ACORN
21pub const VALE_VERSION: &str = "3.9.4";
22/// Default Vale configuration path
23pub const DEFAULT_VALE_ROOT: &str = "./.vale/";
24/// URL for custom ORNL Science Vale package
25pub const DEFAULT_VALE_PACKAGE_URL: &str = "https://code.ornl.gov/research-enablement/vale-package/-/archive/v0.0.1/vale-package-v0.0.1.zip";
26/// Custom Vale package name
27pub const CUSTOM_VALE_PACKAGE_NAME: &str = "Science";
28/// Enabled Vale packages
29pub const ENABLED_VALE_PACKAGES: [&str; 4] = ["Google", "proselint", "write-good", "Joblint"];
30/// Disabled Vale rules
31pub const DISABLED_VALE_RULES: [&str; 14] = [
32    "Vale.Terms",
33    "Google.EmDash",
34    "Google.Contractions",
35    "Google.GenderBias",
36    "Google.Headings",
37    "Google.Parens",
38    "Google.Quotes",
39    "Google.We",
40    "Joblint.Competitive",
41    "proselint.GenderBias",
42    "write-good.E-Prime",
43    "write-good.Passive",
44    "write-good.TooWordy",
45    "write-good.Weasel",
46];
47// Project folder values
48/// Application name
49pub const APPLICATION: &str = "acorn";
50/// Organization name
51pub const ORGANIZATION: &str = "ornl";
52/// Organization qualifier
53pub const QUALIFIER: &str = "org";
54// Schema defaults
55/// Default affiliation
56pub const DEFAULT_AFFILIATION: &str = "Oak Ridge National Laboratory";
57/// Default graphic content URL (href)
58pub const DEFAULT_GRAPHIC_HREF: &str = "00.png";
59/// Default graphic caption
60pub const DEFAULT_GRAPHIC_CAPTION: &str = "";
61/// Default schema URI for ORCiD values
62pub const DEFAULT_ORCID_SCHEMA_URI: &str = "https://orcid.org/";
63/// Maxumum number of [`ResearchActivity`] [`approaches`]
64///
65/// [`ResearchActivity`]: ../schema/struct.ResearchActivity.html
66/// [`approaches`]: ../schema/struct.Sections.html#structfield.approach
67pub const MAX_COUNT_APPROACH: u64 = 6;
68/// Maxumum number of [`ResearchActivity`] [`capabilities`]
69///
70/// [`ResearchActivity`]: ../schema/struct.ResearchActivity.html
71/// [`capabilities`]: ../schema/struct.Sections.html#structfield.capabilities
72pub const MAX_COUNT_CAPABILITIES: u64 = 6;
73/// Maxumum number of [impact statements](../schema/struct.Sections.html#structfield.impact)
74pub const MAX_COUNT_IMPACT: u64 = 6;
75/// Maximum number of [research areas](../schema/struct.Research.html#structfield.areas)
76pub const MAX_COUNT_RESEARCH_AREAS: u64 = 4;
77/// Maximum number of characters for an [`approach`] statement
78///
79/// [`approach`]: ../schema/struct.Sections.html#structfield.approach
80pub const MAX_LENGTH_APPROACH: usize = 150;
81/// Maximum number of characters for a single [`capability`] description
82///
83/// [`capability`]: ../schema/struct.Sections.html#structfield.capabilities
84pub const MAX_LENGTH_CAPABILIY: usize = 300;
85/// Maximum number of characters for a single image caption
86pub const MAX_LENGTH_IMAGE_CAPTION: u64 = 100;
87/// Maximum number of characters for a single impact description
88pub const MAX_LENGTH_IMPACT: usize = 150;
89/// Maximum number of characters for a single [research area](../schema/struct.Research.html#structfield.areas) description
90pub const MAX_LENGTH_RESEARCH_AREA: usize = 40;
91/// Maximum number of characters for an single [research focus](../schema/struct.Research.html#structfield.focus) description
92pub const MAX_LENGTH_RESEARCH_FOCUS: u64 = 150;
93/// Maximum number of characters for a  [challenge](../schema/struct.Sections.html#structfield.challenge) section
94pub const MAX_LENGTH_SECTION_CHALLENGE: u64 = 500;
95/// Maximum number of characters for a [mission](../schema/struct.Sections.html#structfield.mission) section
96pub const MAX_LENGTH_SECTION_MISSION: u64 = 250;
97/// Maximum number of characters for a [`subtitle`]
98///
99/// [`subtitle`]: ../schema/struct.ResearchActivity.html#structfield.subtitle
100pub const MAX_LENGTH_SUBTITLE: u64 = 75;
101/// Maximum number of characters for a [`title`]
102///
103/// [`title`]: ../schema/struct.ResearchActivity.html#structfield.title
104pub const MAX_LENGTH_TITLE: u64 = 45;
105// Readability defaults
106/// Automated Readability Index (ARI) maximum allowed value
107///
108/// This value maps to 12th grade (high school senior) reading level
109pub const MAX_ALLOWED_ARI: f64 = 18.0;
110/// Coleman-Liau Index (CLI) maximum allowed value
111///
112/// This value maps to 12th grade (high school senior) reading level
113pub const MAX_ALLOWED_CLI: f64 = 12.0;
114/// Flesch-Kincaid Grade Level (FKGL) maximum allowed value
115///
116/// This value maps to 12th grade (high school senior) reading level
117pub const MAX_ALLOWED_FKGL: f64 = 12.0;
118/// Flesch Reading Ease Score (FRES) maximum allowed value
119///
120/// This value maps to 12th grade (high school senior) reading level
121pub const MAX_ALLOWED_FRES: f64 = 50.0;
122/// Gunning Fog Index (GFI) maximum allowed value
123///
124/// This value maps to 12th grade (high school senior) reading level
125pub const MAX_ALLOWED_GFI: f64 = 12.0;
126/// Lix Index (Lix) maximum allowed va
127///
128/// This value is somewhere in between "very easy" (20) and "very difficult" (60), skewed toward "very difficult"
129pub const MAX_ALLOWED_LIX: f64 = 50.0;
130/// Simple Measure of Gobbledygook (SMOG) maximum allowed value
131///
132/// This value maps to upper end of high school (12th grade) reading level
133pub const MAX_ALLOWED_SMOG: f64 = 13.0;
134/// Pattern text for ARK regular expression defined by [`RE_ARK`]
135pub const RE_ARK_TEXT: &str = r#"^(?<nma>(?<schema_uri>https\:\/\/).+)?\/?(?<label>ark\:\/?)\/?(?<naan>\d{2,9})\/(?<assigned_name>[a-z0-9A-Z]+)?\/?(?<parts>[^.]+)?\.?(?<variants>[a-zA-Z0-9-.]+)?$"#;
136/// Pattern text for DOI regular expression defined by [`RE_DOI`]
137pub const RE_DOI_TEXT: &str =
138    r#"^(?<schema_uri>https[:]\/\/doi\.org\/)?(?<directory_indicator>10).(?<registrant_code>\d{4,9})\/(?<suffix>[-._;()/:a-zA-Z0-9]+)$"#;
139/// Patter text for ORCiD regular expression defined by [`RE_ORCID`]
140pub const RE_ORCID_TEXT: &str =
141    r#"^(?<schema_uri>https[:]\/\/orcid\.org\/)?(?<identifier>[0-9]{4}-?[0-9]{4}-?[0-9]{4}-?[0-9]{3}(?<check_digit>[0-9X]))$"#;
142
143lazy_static! {
144    /// Regex that should match a Archival Resource Key (ARK)
145    ///
146    /// See <https://arks.org/> for more information
147    pub static ref RE_ARK: Regex = Regex::new(RE_ARK_TEXT).unwrap();
148    /// Regex that should match a Digital Object Identifier (DOI)
149    ///
150    /// See <https://www.doi.org/doi-handbook/HTML/index.html> for more information
151    pub static ref RE_DOI: Regex = Regex::new(RE_DOI_TEXT).unwrap();
152    /// Regex that should match an Open Researcher and Contributor ID (ORCiD) value
153    ///
154/// See <https://orcid.org/> for more information
155    pub static ref RE_ORCID: Regex = Regex::new(RE_ORCID_TEXT).unwrap();
156    /// Regex that should match a Research Activity Identifier (RAiD)
157    ///
158    /// See <https://raid.org/> for more information
159    pub static ref RE_RAID: Regex = Regex::new(RE_DOI_TEXT).unwrap();
160    /// Regex that should match a Research Organization Registry (ROR)
161    ///
162    /// See <https://www.ror.org/> for more information
163    pub static ref RE_ROR: Regex = Regex::new(r#"^(?<schema_uri>(https[:]\/\/ror\.org\/)|(ror[.]org\/))?0[a-hj-km-np-tv-z|0-9]{6}[0-9]{2}$"#).unwrap();
164    /// Regex that should match an image extension (e.g. .png, .jpg, .jpeg, .svg)
165    pub static ref RE_IMAGE_EXTENSION: Regex = Regex::new(r#".*[.](png|PNG|jpg|JPG|jpeg|JPEG|svg|SVG|gif|GIF|webp|WEBP|tiff|TIFF)$"#).unwrap();
166    /// Regex that should match an IP6 address
167    pub static ref RE_IP6: Regex = Regex::new(r#"(([0-9a-fA-F]{1,4}:){7,7}[0-9a-fA-F]{1,4}|([0-9a-fA-F]{1,4}:){1,7}:|([0-9a-fA-F]{1,4}:){1,6}:[0-9a-fA-F]{1,4}|([0-9a-fA-F]{1,4}:){1,5}(:[0-9a-fA-F]{1,4}){1,2}|([0-9a-fA-F]{1,4}:){1,4}(:[0-9a-fA-F]{1,4}){1,3}|([0-9a-fA-F]{1,4}:){1,3}(:[0-9a-fA-F]{1,4}){1,4}|([0-9a-fA-F]{1,4}:){1,2}(:[0-9a-fA-F]{1,4}){1,5}|[0-9a-fA-F]{1,4}:((:[0-9a-fA-F]{1,4}){1,6})|:((:[0-9a-fA-F]{1,4}){1,7}|:)|fe80:(:[0-9a-fA-F]{0,4}){0,4}%[0-9a-zA-Z]{1,}|::(ffff(:0{1,4}){0,1}:){0,1}((25[0-5]|(2[0-4]|1{0,1}[0-9]){0,1}[0-9])\.){3,3}(25[0-5]|(2[0-4]|1{0,1}[0-9]){0,1}[0-9])|([0-9a-fA-F]{1,4}:){1,4}:((25[0-5]|(2[0-4]|1{0,1}[0-9]){0,1}[0-9])\.){3,3}(25[0-5]|(2[0-4]|1{0,1}[0-9]){0,1}[0-9]))"#).unwrap();
168    /// Regex that should match an ISO 8601 date (e.g., `YYYY-MM-DD`)
169    /// ### Example
170    /// > `2025-06-04`
171    pub static ref RE_ISO_8601_DATE: Regex = Regex::new(r#"^(?<year>(19[5-9][0-9]|20[0-2][0-9]))-(?<month>(((0[13578]|(10|12)))-(?<day>(0[1-9]|[1-2][0-9]|3[0-1]))|(02-(0[1-9]|[1-2][0-9]))|((0[469]|11)-(0[1-9]|[1-2][0-9]|30))))$"#).unwrap();
172    /// Regex that should match an ISO 8601 year from modern times, 1950 through 2029
173    /// ### Example
174    /// > `2025`
175    pub static ref RE_ISO_8601_YEAR: Regex = Regex::new(r#"^(?<year>(19[5-9][0-9]|20[0-2][0-9]))$"#).unwrap();
176    /// Regex that should match a phone number (with optional country and area codes)
177    pub static ref RE_PHONE: Regex = Regex::new(r#"^(?<country>\+\d{1,2}\s?)?(?<area>\(?\d{3}\)?)[\s.-]?(?<prefix>\d{3})[\s.-]?(?<line>\d{4})$"#).unwrap();
178    /// Regex that should match a fake phone number (e.g. 555.555.5555)
179    pub static ref RE_FAKE_PHONE: Regex = Regex::new(r#"^(\+\d{1,2}\s?)?\(?5{3}\)?[\s.-]?5{3}[\s.-]?5{4}$"#).unwrap();
180    /// Regex that should match a Unix epoch (ex. 1759017645)
181    pub static ref RE_UNIX_EPOCH: Regex = Regex::new(r#"^\d{10}$"#).unwrap();
182}