sqruff_lib/rules/ambiguous/
am05.rsuse std::str::FromStr;
use ahash::AHashMap;
use smol_str::StrExt;
use sqruff_lib_core::dialects::syntax::{SyntaxKind, SyntaxSet};
use sqruff_lib_core::lint_fix::LintFix;
use sqruff_lib_core::parser::segments::base::SegmentBuilder;
use strum_macros::{AsRefStr, EnumString};
use crate::core::config::Value;
use crate::core::rules::base::{Erased, ErasedRule, LintResult, Rule, RuleGroups};
use crate::core::rules::context::RuleContext;
use crate::core::rules::crawlers::{Crawler, SegmentSeekerCrawler};
#[derive(Clone, Debug)]
pub struct RuleAM05 {
fully_qualify_join_types: JoinType,
}
#[derive(Clone, Debug, Copy, PartialEq, Eq, Hash, AsRefStr, EnumString)]
#[strum(serialize_all = "lowercase")]
enum JoinType {
Inner,
Outer,
Both,
}
impl Default for RuleAM05 {
fn default() -> Self {
Self {
fully_qualify_join_types: JoinType::Inner,
}
}
}
impl Rule for RuleAM05 {
fn load_from_config(&self, config: &AHashMap<String, Value>) -> Result<ErasedRule, String> {
let fully_qualify_join_types = config["fully_qualify_join_types"].as_string();
match fully_qualify_join_types {
None => Err("Rule AM05 expects a `fully_qualify_join_types` array".to_string()),
Some(join_type) => {
let join_type = JoinType::from_str(join_type).map_err(|_| {
format!(
"Rule AM05 expects a `fully_qualify_join_types` array of valid join \
types. Got: {}",
join_type
)
})?;
Ok(RuleAM05 {
fully_qualify_join_types: join_type,
}
.erased())
}
}
}
fn name(&self) -> &'static str {
"ambiguous.join"
}
fn description(&self) -> &'static str {
"Join clauses should be fully qualified."
}
fn long_description(&self) -> &'static str {
r#"
**Anti-pattern**
In this example, `UNION DISTINCT` should be preferred over `UNION`, because explicit is better than implicit.
```sql
SELECT a, b FROM table_1
UNION
SELECT a, b FROM table_2
```
**Best practice**
Specify `DISTINCT` or `ALL` after `UNION` (note that `DISTINCT` is the default behavior).
```sql
SELECT a, b FROM table_1
UNION DISTINCT
SELECT a, b FROM table_2
```
"#
}
fn groups(&self) -> &'static [RuleGroups] {
&[RuleGroups::All, RuleGroups::Ambiguous]
}
fn eval(&self, context: RuleContext) -> Vec<LintResult> {
assert!(context.segment.is_type(SyntaxKind::JoinClause));
let join_clause_keywords = context
.segment
.segments()
.iter()
.filter(|segment| segment.is_type(SyntaxKind::Keyword))
.collect::<Vec<_>>();
if (self.fully_qualify_join_types == JoinType::Outer
|| self.fully_qualify_join_types == JoinType::Both)
&& ["RIGHT", "LEFT", "FULL"].contains(
&join_clause_keywords[0]
.raw()
.to_uppercase_smolstr()
.as_str(),
)
&& join_clause_keywords[1].raw().eq_ignore_ascii_case("JOIN")
{
let outer_keyword = if join_clause_keywords[1].raw() == "JOIN" {
"OUTER"
} else {
"outer"
};
return vec![LintResult::new(
context.segment.segments()[0].clone().into(),
vec![LintFix::create_after(
context.segment.segments()[0].clone(),
vec![
SegmentBuilder::whitespace(context.tables.next_id(), " "),
SegmentBuilder::keyword(context.tables.next_id(), outer_keyword),
],
None,
)],
None,
None,
)];
};
if (self.fully_qualify_join_types == JoinType::Inner
|| self.fully_qualify_join_types == JoinType::Both)
&& join_clause_keywords[0].raw().eq_ignore_ascii_case("JOIN")
{
let inner_keyword = if join_clause_keywords[0].raw() == "JOIN" {
"INNER"
} else {
"inner"
};
return vec![LintResult::new(
context.segment.segments()[0].clone().into(),
vec![LintFix::create_before(
context.segment.segments()[0].clone(),
vec![
SegmentBuilder::keyword(context.tables.next_id(), inner_keyword),
SegmentBuilder::whitespace(context.tables.next_id(), " "),
],
)],
None,
None,
)];
}
vec![]
}
fn is_fix_compatible(&self) -> bool {
true
}
fn crawl_behaviour(&self) -> Crawler {
SegmentSeekerCrawler::new(const { SyntaxSet::new(&[SyntaxKind::JoinClause]) }).into()
}
}