132 lines
4.3 KiB
Rust
132 lines
4.3 KiB
Rust
|
// Copyright 2012-2015 The Rust Project Developers. See the COPYRIGHT
|
|||
|
// file at the top-level directory of this distribution and at
|
|||
|
// http://rust-lang.org/COPYRIGHT.
|
|||
|
//
|
|||
|
// Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
|
|||
|
// http://www.apache.org/licenses/LICENSE-2.0> or the MIT license
|
|||
|
// <LICENSE-MIT or http://opensource.org/licenses/MIT>, at your
|
|||
|
// option. This file may not be copied, modified, or distributed
|
|||
|
// except according to those terms.
|
|||
|
|
|||
|
//! Determine displayed width of `char` and `str` types according to
|
|||
|
//! [Unicode Standard Annex #11](http://www.unicode.org/reports/tr11/)
|
|||
|
//! rules.
|
|||
|
//!
|
|||
|
//! ```rust
|
|||
|
//! extern crate unicode_width;
|
|||
|
//!
|
|||
|
//! use unicode_width::UnicodeWidthStr;
|
|||
|
//!
|
|||
|
//! fn main() {
|
|||
|
//! let teststr = "Hello, world!";
|
|||
|
//! let width = UnicodeWidthStr::width(teststr);
|
|||
|
//! println!("{}", teststr);
|
|||
|
//! println!("The above string is {} columns wide.", width);
|
|||
|
//! let width = teststr.width_cjk();
|
|||
|
//! println!("The above string is {} columns wide (CJK).", width);
|
|||
|
//! }
|
|||
|
//! ```
|
|||
|
//!
|
|||
|
//! # features
|
|||
|
//!
|
|||
|
//! unicode-width supports a `no_std` feature. This eliminates dependence
|
|||
|
//! on std, and instead uses equivalent functions from core.
|
|||
|
//!
|
|||
|
//! # crates.io
|
|||
|
//!
|
|||
|
//! You can use this package in your project by adding the following
|
|||
|
//! to your `Cargo.toml`:
|
|||
|
//!
|
|||
|
//! ```toml
|
|||
|
//! [dependencies]
|
|||
|
//! unicode-width = "0.1.5"
|
|||
|
//! ```
|
|||
|
|
|||
|
#![deny(missing_docs, unsafe_code)]
|
|||
|
#![doc(html_logo_url = "https://unicode-rs.github.io/unicode-rs_sm.png",
|
|||
|
html_favicon_url = "https://unicode-rs.github.io/unicode-rs_sm.png")]
|
|||
|
|
|||
|
#![cfg_attr(feature = "bench", feature(test))]
|
|||
|
#![no_std]
|
|||
|
|
|||
|
#[cfg(test)]
|
|||
|
#[macro_use]
|
|||
|
extern crate std;
|
|||
|
|
|||
|
#[cfg(feature = "bench")]
|
|||
|
extern crate test;
|
|||
|
|
|||
|
use tables::charwidth as cw;
|
|||
|
pub use tables::UNICODE_VERSION;
|
|||
|
|
|||
|
use core::ops::Add;
|
|||
|
|
|||
|
mod tables;
|
|||
|
|
|||
|
#[cfg(test)]
|
|||
|
mod tests;
|
|||
|
|
|||
|
/// Extension methods reporting how many columns a Unicode character
/// occupies when displayed.
pub trait UnicodeWidthChar {
    /// Computes this character's displayed width, measured in columns.
    ///
    /// Yields `None` when the character is a control character, with the
    /// single exception of `'\x00'`.
    ///
    /// Characters that
    /// [Unicode Standard Annex #11](http://www.unicode.org/reports/tr11/)
    /// places in the Ambiguous category are counted as 1 column wide. That
    /// matches the recommendation for non-CJK contexts, and for cases where
    /// the context cannot be reliably determined.
    fn width(self) -> Option<usize>;

    /// Computes this character's displayed width, measured in columns,
    /// using CJK conventions.
    ///
    /// Yields `None` when the character is a control character, with the
    /// single exception of `'\x00'`.
    ///
    /// Characters that
    /// [Unicode Standard Annex #11](http://www.unicode.org/reports/tr11/)
    /// places in the Ambiguous category are counted as 2 columns wide. That
    /// matches the recommendation for CJK contexts.
    fn width_cjk(self) -> Option<usize>;
}
|
|||
|
|
|||
|
impl UnicodeWidthChar for char {
|
|||
|
#[inline]
|
|||
|
fn width(self) -> Option<usize> { cw::width(self, false) }
|
|||
|
|
|||
|
#[inline]
|
|||
|
fn width_cjk(self) -> Option<usize> { cw::width(self, true) }
|
|||
|
}
|
|||
|
|
|||
|
/// Methods for determining displayed width of Unicode strings.
pub trait UnicodeWidthStr {
    /// Returns the string's displayed width in columns.
    ///
    /// Control characters are treated as having zero width.
    ///
    /// This function treats characters in the Ambiguous category according
    /// to [Unicode Standard Annex #11](http://www.unicode.org/reports/tr11/)
    /// as 1 column wide. This is consistent with the recommendations for
    /// non-CJK contexts, or when the context cannot be reliably determined.
    // The receiver lifetime is elided: a named lifetime that only appears on
    // `&self` adds nothing, and implementors remain free to spell it out.
    fn width(&self) -> usize;

    /// Returns the string's displayed width in columns.
    ///
    /// Control characters are treated as having zero width.
    ///
    /// This function treats characters in the Ambiguous category according
    /// to [Unicode Standard Annex #11](http://www.unicode.org/reports/tr11/)
    /// as 2 columns wide. This is consistent with the recommendations for
    /// CJK contexts.
    fn width_cjk(&self) -> usize;
}
|
|||
|
|
|||
|
impl UnicodeWidthStr for str {
|
|||
|
#[inline]
|
|||
|
fn width(&self) -> usize {
|
|||
|
self.chars().map(|c| cw::width(c, false).unwrap_or(0)).fold(0, Add::add)
|
|||
|
}
|
|||
|
|
|||
|
#[inline]
|
|||
|
fn width_cjk(&self) -> usize {
|
|||
|
self.chars().map(|c| cw::width(c, true).unwrap_or(0)).fold(0, Add::add)
|
|||
|
}
|
|||
|
}
|