// sqruff_lib/rules/references/rf05.rs
use ahash::{AHashMap, AHashSet};
use regex::Regex;
use sqruff_lib_core::dialects::init::DialectKind;
use sqruff_lib_core::dialects::syntax::{SyntaxKind, SyntaxSet};
use crate::core::config::Value;
use crate::core::rules::base::{Erased, ErasedRule, LintResult, Rule, RuleGroups};
use crate::core::rules::context::RuleContext;
use crate::core::rules::crawlers::{Crawler, SegmentSeekerCrawler};
use crate::utils::identifers::identifiers_policy_applicable;
/// Lint rule `references.special_chars` (RF05): reports identifiers that contain
/// characters other than ASCII letters and digits once the configured allowances
/// (underscores, optional spaces, extra allowed characters) have been removed.
#[derive(Clone, Default, Debug)]
pub struct RuleRF05 {
/// Policy string handed to `identifiers_policy_applicable` when the segment is a
/// quoted identifier.
quoted_identifiers_policy: String,
/// Policy string handed to `identifiers_policy_applicable` for every other
/// (unquoted) identifier.
unquoted_identifiers_policy: String,
/// When `true`, spaces inside quoted identifiers are removed before the check,
/// so they never trigger a violation.
allow_space_in_identifier: bool,
/// Extra characters that are removed from the identifier before the check.
additional_allowed_characters: String,
/// Identifiers to skip; stored lowercased at load time and compared against the
/// lowercased identifier text.
ignore_words: Vec<String>,
/// Patterns to skip; an identifier matching any of them is never reported.
ignore_words_regex: Vec<Regex>,
}
impl Rule for RuleRF05 {
fn load_from_config(&self, config: &AHashMap<String, Value>) -> Result<ErasedRule, String> {
Ok(RuleRF05 {
unquoted_identifiers_policy: config["unquoted_identifiers_policy"]
.as_string()
.unwrap()
.to_owned(),
quoted_identifiers_policy: config["quoted_identifiers_policy"]
.as_string()
.unwrap()
.to_owned(),
ignore_words: config["ignore_words"]
.map(|it| {
it.as_array()
.unwrap()
.iter()
.map(|it| it.as_string().unwrap().to_lowercase())
.collect()
})
.unwrap_or_default(),
ignore_words_regex: config["ignore_words_regex"]
.map(|it| {
it.as_array()
.unwrap()
.iter()
.map(|it| Regex::new(it.as_string().unwrap()).unwrap())
.collect()
})
.unwrap_or_default(),
allow_space_in_identifier: config["allow_space_in_identifier"].as_bool().unwrap(),
additional_allowed_characters: config["additional_allowed_characters"]
.map(|it| it.as_string().unwrap().to_owned())
.unwrap_or_default(),
}
.erased())
}
fn name(&self) -> &'static str {
"references.special_chars"
}
fn description(&self) -> &'static str {
"Do not use special characters in identifiers."
}
fn long_description(&self) -> &'static str {
r"
**Anti-pattern**
Using special characters within identifiers when creating or aliasing objects.
```sql
CREATE TABLE DBO.ColumnNames
(
[Internal Space] INT,
[Greater>Than] INT,
[Less<Than] INT,
Number# INT
)
```
**Best practice**
Identifiers should include only alphanumerics and underscores.
```sql
CREATE TABLE DBO.ColumnNames
(
[Internal_Space] INT,
[GreaterThan] INT,
[LessThan] INT,
NumberVal INT
)
```
"
}
fn groups(&self) -> &'static [RuleGroups] {
&[RuleGroups::All, RuleGroups::References]
}
fn eval(&self, context: RuleContext) -> Vec<LintResult> {
if self
.ignore_words
.contains(&context.segment.raw().to_lowercase())
|| self
.ignore_words_regex
.iter()
.any(|it| it.is_match(context.segment.raw().as_ref()))
{
return Vec::new();
}
let mut policy = self.unquoted_identifiers_policy.as_str();
let mut identifier = context.segment.raw().to_string();
if context.segment.is_type(SyntaxKind::QuotedIdentifier) {
policy = self.quoted_identifiers_policy.as_str();
identifier = identifier[1..identifier.len() - 1].to_string();
if self.ignore_words.contains(&identifier.to_lowercase())
|| self
.ignore_words_regex
.iter()
.any(|it| it.is_match(&identifier))
{
return Vec::new();
}
if context.dialect.name == DialectKind::Bigquery
&& context
.parent_stack
.last()
.map_or(false, |it| it.is_type(SyntaxKind::TableReference))
{
if identifier.ends_with('*') {
identifier.pop();
}
identifier = identifier.replace(".", "");
}
if context.dialect.name == DialectKind::Sparksql && !context.parent_stack.is_empty() {
if context
.parent_stack
.last()
.unwrap()
.is_type(SyntaxKind::FileReference)
{
return Vec::new();
}
if context
.parent_stack
.last()
.unwrap()
.is_type(SyntaxKind::PropertyNameIdentifier)
{
identifier = identifier.replace(".", "");
}
}
if self.allow_space_in_identifier {
identifier = identifier.replace(" ", "");
}
}
identifier = identifier.replace("_", "");
if context.dialect.name == DialectKind::Redshift
&& identifier.starts_with('#')
&& context
.parent_stack
.last()
.map_or(false, |it| it.get_type() == SyntaxKind::TableReference)
{
identifier = identifier[1..].to_string();
}
let additional_allowed_characters =
self.get_additional_allowed_characters(context.dialect.name);
if !additional_allowed_characters.is_empty() {
identifier.retain(|it| !additional_allowed_characters.contains(&it));
}
if identifiers_policy_applicable(policy, &context.parent_stack)
&& !identifier.chars().all(|c| c.is_ascii_alphanumeric())
{
return vec![LintResult::new(
context.segment.into(),
Vec::new(),
None,
None,
)];
}
Vec::new()
}
fn crawl_behaviour(&self) -> Crawler {
SegmentSeekerCrawler::new(
const { SyntaxSet::new(&[SyntaxKind::QuotedIdentifier, SyntaxKind::NakedIdentifier]) },
)
.into()
}
}
impl RuleRF05 {
    /// Collects every character that is tolerated in addition to ASCII
    /// alphanumerics: the configured `additional_allowed_characters`, plus `-`
    /// when the dialect is BigQuery.
    fn get_additional_allowed_characters(&self, dialect_name: DialectKind) -> AHashSet<char> {
        // `Some('-')` for BigQuery, `None` for every other dialect.
        let dialect_extra = (dialect_name == DialectKind::Bigquery).then_some('-');

        self.additional_allowed_characters
            .chars()
            .chain(dialect_extra)
            .collect()
    }
}