Skip to content

Commit

Permalink
Minor: Add documentation explaining that initcap oly works for ASCII (a…
Browse files Browse the repository at this point in the history
  • Loading branch information
alamb authored Dec 13, 2024
1 parent 320e4d6 commit b69fa67
Show file tree
Hide file tree
Showing 2 changed files with 23 additions and 10 deletions.
29 changes: 20 additions & 9 deletions datafusion/functions/src/string/initcap.rs
Original file line number Diff line number Diff line change
Expand Up @@ -90,25 +90,36 @@ fn get_initcap_doc() -> &'static Documentation {
DOCUMENTATION.get_or_init(|| {
Documentation::builder(
DOC_SECTION_STRING,
"Capitalizes the first character in each word in the input string. Words are delimited by non-alphanumeric characters.",
"initcap(str)")
.with_sql_example(r#"```sql
"Capitalizes the first character in each word in the ASCII input string. \
Words are delimited by non-alphanumeric characters.\n\n\
Note this function does not support UTF-8 characters.",
"initcap(str)",
)
.with_sql_example(
r#"```sql
> select initcap('apache datafusion');
+------------------------------------+
| initcap(Utf8("apache datafusion")) |
+------------------------------------+
| Apache Datafusion |
+------------------------------------+
```"#)
.with_standard_argument("str", Some("String"))
.with_related_udf("lower")
.with_related_udf("upper")
.build()
```"#,
)
.with_standard_argument("str", Some("String"))
.with_related_udf("lower")
.with_related_udf("upper")
.build()
})
}

/// Converts the first letter of each word to upper case and the rest to lower case. Words are sequences of alphanumeric characters separated by non-alphanumeric characters.
/// Converts the first letter of each word to upper case and the rest to lower
/// case. Words are sequences of alphanumeric characters separated by
/// non-alphanumeric characters.
///
/// Example:
/// ```sql
/// initcap('hi THOMAS') = 'Hi Thomas'
/// ```
fn initcap<T: OffsetSizeTrait>(args: &[ArrayRef]) -> Result<ArrayRef> {
let string_array = as_generic_string_array::<T>(&args[0])?;

Expand Down
4 changes: 3 additions & 1 deletion docs/source/user-guide/sql/scalar_functions.md
Original file line number Diff line number Diff line change
Expand Up @@ -1046,7 +1046,9 @@ find_in_set(str, strlist)

### `initcap`

Capitalizes the first character in each word in the input string. Words are delimited by non-alphanumeric characters.
Capitalizes the first character in each word in the ASCII input string. Words are delimited by non-alphanumeric characters.

Note this function does not support UTF-8 characters.

```
initcap(str)
Expand Down

0 comments on commit b69fa67

Please sign in to comment.