Use byte indices instead of char indices for text runs

Replace character indices with UTF-8 byte offsets throughout the code dealing
with text shaping and breaking.  This eliminates a lot of complexity when
converting from one to the other, and interoperates better with the rest of
the Rust ecosystem.
This commit is contained in:
Matt Brubeck 2016-04-27 11:22:02 -07:00
parent dba878dfb2
commit 659305fe0a
15 changed files with 259 additions and 437 deletions

View file

@ -43,7 +43,7 @@ use style::computed_values::{border_style, filter, image_rendering, mix_blend_mo
use style::properties::{ComputedValues}; use style::properties::{ComputedValues};
use style_traits::cursor::Cursor; use style_traits::cursor::Cursor;
use text::TextRun; use text::TextRun;
use text::glyph::CharIndex; use text::glyph::ByteIndex;
use util::geometry::{self, MAX_RECT, ScreenPx}; use util::geometry::{self, MAX_RECT, ScreenPx};
use util::print_tree::PrintTree; use util::print_tree::PrintTree;
use webrender_traits::{self, WebGLContextId}; use webrender_traits::{self, WebGLContextId};
@ -989,7 +989,7 @@ pub struct TextDisplayItem {
pub text_run: Arc<TextRun>, pub text_run: Arc<TextRun>,
/// The range of text within the text run. /// The range of text within the text run.
pub range: Range<CharIndex>, pub range: Range<ByteIndex>,
/// The color of the text. /// The color of the text.
pub text_color: Color, pub text_color: Color,

View file

@ -154,7 +154,7 @@ impl Font {
let start_time = time::precise_time_ns(); let start_time = time::precise_time_ns();
let mut glyphs = GlyphStore::new(text.chars().count(), let mut glyphs = GlyphStore::new(text.len(),
options.flags.contains(IS_WHITESPACE_SHAPING_FLAG), options.flags.contains(IS_WHITESPACE_SHAPING_FLAG),
options.flags.contains(RTL_FLAG)); options.flags.contains(RTL_FLAG));
shaper.as_ref().unwrap().shape_text(text, options, &mut glyphs); shaper.as_ref().unwrap().shape_text(text, options, &mut glyphs);

View file

@ -33,7 +33,7 @@ use std::default::Default;
use std::{f32, mem, ptr}; use std::{f32, mem, ptr};
use style::computed_values::{border_style, filter, image_rendering, mix_blend_mode}; use style::computed_values::{border_style, filter, image_rendering, mix_blend_mode};
use text::TextRun; use text::TextRun;
use text::glyph::CharIndex; use text::glyph::ByteIndex;
use util::geometry::{self, MAX_RECT, PagePx, ScreenPx}; use util::geometry::{self, MAX_RECT, PagePx, ScreenPx};
use util::opts; use util::opts;
@ -1768,7 +1768,7 @@ trait ScaledFontExtensionMethods {
fn draw_text(&self, fn draw_text(&self,
draw_target: &DrawTarget, draw_target: &DrawTarget,
run: &TextRun, run: &TextRun,
range: &Range<CharIndex>, range: &Range<ByteIndex>,
baseline_origin: Point2D<Au>, baseline_origin: Point2D<Au>,
color: Color, color: Color,
antialias: bool); antialias: bool);
@ -1779,7 +1779,7 @@ impl ScaledFontExtensionMethods for ScaledFont {
fn draw_text(&self, fn draw_text(&self,
draw_target: &DrawTarget, draw_target: &DrawTarget,
run: &TextRun, run: &TextRun,
range: &Range<CharIndex>, range: &Range<ByteIndex>,
baseline_origin: Point2D<Au>, baseline_origin: Point2D<Au>,
color: Color, color: Color,
antialias: bool) { antialias: bool) {
@ -1795,11 +1795,10 @@ impl ScaledFontExtensionMethods for ScaledFont {
}; };
let mut origin = baseline_origin.clone(); let mut origin = baseline_origin.clone();
let mut azglyphs = vec!(); let mut azglyphs = Vec::with_capacity(range.length().to_usize());
azglyphs.reserve(range.length().to_usize());
for slice in run.natural_word_slices_in_visual_order(range) { for slice in run.natural_word_slices_in_visual_order(range) {
for glyph in slice.glyphs.iter_glyphs_for_char_range(&slice.range) { for glyph in slice.glyphs.iter_glyphs_for_byte_range(&slice.range) {
let glyph_advance = glyph.advance(); let glyph_advance = glyph.advance();
let glyph_offset = glyph.offset().unwrap_or(Point2D::zero()); let glyph_offset = glyph.offset().unwrap_or(Point2D::zero());
let azglyph = struct__AzGlyph { let azglyph = struct__AzGlyph {

View file

@ -164,7 +164,7 @@ impl DetailedGlyph {
#[derive(PartialEq, Clone, Eq, Debug, Copy, Deserialize, Serialize)] #[derive(PartialEq, Clone, Eq, Debug, Copy, Deserialize, Serialize)]
struct DetailedGlyphRecord { struct DetailedGlyphRecord {
// source string offset/GlyphEntry offset in the TextRun // source string offset/GlyphEntry offset in the TextRun
entry_offset: CharIndex, entry_offset: ByteIndex,
// offset into the detailed glyphs buffer // offset into the detailed glyphs buffer
detail_offset: usize, detail_offset: usize,
} }
@ -205,7 +205,7 @@ impl<'a> DetailedGlyphStore {
} }
} }
fn add_detailed_glyphs_for_entry(&mut self, entry_offset: CharIndex, glyphs: &[DetailedGlyph]) { fn add_detailed_glyphs_for_entry(&mut self, entry_offset: ByteIndex, glyphs: &[DetailedGlyph]) {
let entry = DetailedGlyphRecord { let entry = DetailedGlyphRecord {
entry_offset: entry_offset, entry_offset: entry_offset,
detail_offset: self.detail_buffer.len(), detail_offset: self.detail_buffer.len(),
@ -229,7 +229,7 @@ impl<'a> DetailedGlyphStore {
self.lookup_is_sorted = false; self.lookup_is_sorted = false;
} }
fn detailed_glyphs_for_entry(&'a self, entry_offset: CharIndex, count: u16) fn detailed_glyphs_for_entry(&'a self, entry_offset: ByteIndex, count: u16)
-> &'a [DetailedGlyph] { -> &'a [DetailedGlyph] {
debug!("Requesting detailed glyphs[n={}] for entry[off={:?}]", count, entry_offset); debug!("Requesting detailed glyphs[n={}] for entry[off={:?}]", count, entry_offset);
@ -256,7 +256,7 @@ impl<'a> DetailedGlyphStore {
} }
fn detailed_glyph_with_index(&'a self, fn detailed_glyph_with_index(&'a self,
entry_offset: CharIndex, entry_offset: ByteIndex,
detail_offset: u16) detail_offset: u16)
-> &'a DetailedGlyph { -> &'a DetailedGlyph {
assert!((detail_offset as usize) <= self.detail_buffer.len()); assert!((detail_offset as usize) <= self.detail_buffer.len());
@ -336,8 +336,8 @@ impl GlyphData {
// values as they are needed from the GlyphStore, using provided offsets. // values as they are needed from the GlyphStore, using provided offsets.
#[derive(Copy, Clone)] #[derive(Copy, Clone)]
pub enum GlyphInfo<'a> { pub enum GlyphInfo<'a> {
Simple(&'a GlyphStore, CharIndex), Simple(&'a GlyphStore, ByteIndex),
Detail(&'a GlyphStore, CharIndex, u16), Detail(&'a GlyphStore, ByteIndex, u16),
} }
impl<'a> GlyphInfo<'a> { impl<'a> GlyphInfo<'a> {
@ -413,10 +413,10 @@ pub struct GlyphStore {
int_range_index! { int_range_index! {
#[derive(Deserialize, Serialize, RustcEncodable)] #[derive(Deserialize, Serialize, RustcEncodable)]
#[doc = "An index that refers to a character in a text run. This could \ #[doc = "An index that refers to a byte offset in a text run. This could \
point to the middle of a glyph."] point to the middle of a glyph."]
#[derive(HeapSizeOf)] #[derive(HeapSizeOf)]
struct CharIndex(isize) struct ByteIndex(isize)
} }
impl<'a> GlyphStore { impl<'a> GlyphStore {
@ -436,8 +436,8 @@ impl<'a> GlyphStore {
} }
} }
pub fn char_len(&self) -> CharIndex { pub fn len(&self) -> ByteIndex {
CharIndex(self.entry_buffer.len() as isize) ByteIndex(self.entry_buffer.len() as isize)
} }
pub fn is_whitespace(&self) -> bool { pub fn is_whitespace(&self) -> bool {
@ -452,7 +452,7 @@ impl<'a> GlyphStore {
#[inline(never)] #[inline(never)]
fn cache_total_advance(&mut self) { fn cache_total_advance(&mut self) {
let mut total_advance = Au(0); let mut total_advance = Au(0);
for glyph in self.iter_glyphs_for_char_range(&Range::new(CharIndex(0), self.char_len())) { for glyph in self.iter_glyphs_for_byte_range(&Range::new(ByteIndex(0), self.len())) {
total_advance = total_advance + glyph.advance() total_advance = total_advance + glyph.advance()
} }
self.total_advance = total_advance self.total_advance = total_advance
@ -462,10 +462,9 @@ impl<'a> GlyphStore {
self.total_advance self.total_advance
} }
/// Adds a single glyph. If `character` is present, this represents a single character; /// Adds a single glyph.
/// otherwise, this glyph represents multiple characters. pub fn add_glyph_for_byte_index(&mut self,
pub fn add_glyph_for_char_index(&mut self, i: ByteIndex,
i: CharIndex,
character: char, character: char,
data: &GlyphData) { data: &GlyphData) {
let glyph_is_compressible = is_simple_glyph_id(data.id) && let glyph_is_compressible = is_simple_glyph_id(data.id) &&
@ -474,7 +473,7 @@ impl<'a> GlyphStore {
data.cluster_start; // others are stored in detail buffer data.cluster_start; // others are stored in detail buffer
debug_assert!(data.ligature_start); // can't compress ligature continuation glyphs. debug_assert!(data.ligature_start); // can't compress ligature continuation glyphs.
debug_assert!(i < self.char_len()); debug_assert!(i < self.len());
let mut entry = if glyph_is_compressible { let mut entry = if glyph_is_compressible {
GlyphEntry::simple(data.id, data.advance) GlyphEntry::simple(data.id, data.advance)
@ -492,8 +491,8 @@ impl<'a> GlyphStore {
self.entry_buffer[i.to_usize()] = entry; self.entry_buffer[i.to_usize()] = entry;
} }
pub fn add_glyphs_for_char_index(&mut self, i: CharIndex, data_for_glyphs: &[GlyphData]) { pub fn add_glyphs_for_byte_index(&mut self, i: ByteIndex, data_for_glyphs: &[GlyphData]) {
assert!(i < self.char_len()); assert!(i < self.len());
assert!(data_for_glyphs.len() > 0); assert!(data_for_glyphs.len() > 0);
let glyph_count = data_for_glyphs.len(); let glyph_count = data_for_glyphs.len();
@ -518,48 +517,48 @@ impl<'a> GlyphStore {
} }
#[inline] #[inline]
pub fn iter_glyphs_for_char_range(&'a self, rang: &Range<CharIndex>) -> GlyphIterator<'a> { pub fn iter_glyphs_for_byte_range(&'a self, range: &Range<ByteIndex>) -> GlyphIterator<'a> {
if rang.begin() >= self.char_len() { if range.begin() >= self.len() {
panic!("iter_glyphs_for_range: range.begin beyond length!"); panic!("iter_glyphs_for_range: range.begin beyond length!");
} }
if rang.end() > self.char_len() { if range.end() > self.len() {
panic!("iter_glyphs_for_range: range.end beyond length!"); panic!("iter_glyphs_for_range: range.end beyond length!");
} }
GlyphIterator { GlyphIterator {
store: self, store: self,
char_index: if self.is_rtl { rang.end() } else { rang.begin() - CharIndex(1) }, byte_index: if self.is_rtl { range.end() } else { range.begin() - ByteIndex(1) },
char_range: *rang, byte_range: *range,
glyph_range: None, glyph_range: None,
} }
} }
#[inline] #[inline]
pub fn advance_for_char_range(&self, rang: &Range<CharIndex>) -> Au { pub fn advance_for_byte_range(&self, range: &Range<ByteIndex>) -> Au {
if rang.begin() == CharIndex(0) && rang.end() == self.char_len() { if range.begin() == ByteIndex(0) && range.end() == self.len() {
self.total_advance self.total_advance
} else if !self.has_detailed_glyphs { } else if !self.has_detailed_glyphs {
self.advance_for_char_range_simple_glyphs(rang) self.advance_for_byte_range_simple_glyphs(range)
} else { } else {
self.advance_for_char_range_slow_path(rang) self.advance_for_byte_range_slow_path(range)
} }
} }
#[inline] #[inline]
pub fn advance_for_char_range_slow_path(&self, rang: &Range<CharIndex>) -> Au { pub fn advance_for_byte_range_slow_path(&self, range: &Range<ByteIndex>) -> Au {
self.iter_glyphs_for_char_range(rang) self.iter_glyphs_for_byte_range(range)
.fold(Au(0), |advance, glyph| advance + glyph.advance()) .fold(Au(0), |advance, glyph| advance + glyph.advance())
} }
#[inline] #[inline]
#[cfg(any(target_arch = "x86_64", target_arch = "aarch64"))] #[cfg(any(target_arch = "x86_64", target_arch = "aarch64"))]
fn advance_for_char_range_simple_glyphs(&self, rang: &Range<CharIndex>) -> Au { fn advance_for_byte_range_simple_glyphs(&self, range: &Range<ByteIndex>) -> Au {
let mask = u32x4::splat(GLYPH_ADVANCE_MASK); let mask = u32x4::splat(GLYPH_ADVANCE_MASK);
let mut simd_advance = u32x4::splat(0); let mut simd_advance = u32x4::splat(0);
let begin = rang.begin().to_usize(); let begin = range.begin().to_usize();
let len = rang.length().to_usize(); let len = range.length().to_usize();
let num_simd_iterations = len / 4; let num_simd_iterations = len / 4;
let leftover_entries = rang.end().to_usize() - (len - num_simd_iterations * 4); let leftover_entries = range.end().to_usize() - (len - num_simd_iterations * 4);
let buf = self.transmute_entry_buffer_to_u32_buffer(); let buf = self.transmute_entry_buffer_to_u32_buffer();
for i in 0..num_simd_iterations { for i in 0..num_simd_iterations {
@ -575,7 +574,7 @@ impl<'a> GlyphStore {
simd_advance.extract(2) + simd_advance.extract(2) +
simd_advance.extract(3)) as i32; simd_advance.extract(3)) as i32;
let mut leftover = Au(0); let mut leftover = Au(0);
for i in leftover_entries..rang.end().to_usize() { for i in leftover_entries..range.end().to_usize() {
leftover = leftover + self.entry_buffer[i].advance(); leftover = leftover + self.entry_buffer[i].advance();
} }
Au(advance) + leftover Au(advance) + leftover
@ -584,8 +583,8 @@ impl<'a> GlyphStore {
/// When SIMD isn't available (non-x86_x64/aarch64), fallback to the slow path. /// When SIMD isn't available (non-x86_x64/aarch64), fallback to the slow path.
#[inline] #[inline]
#[cfg(not(any(target_arch = "x86_64", target_arch = "aarch64")))] #[cfg(not(any(target_arch = "x86_64", target_arch = "aarch64")))]
fn advance_for_char_range_simple_glyphs(&self, rang: &Range<CharIndex>) -> Au { fn advance_for_byte_range_simple_glyphs(&self, range: &Range<ByteIndex>) -> Au {
self.advance_for_char_range_slow_path(rang) self.advance_for_byte_range_slow_path(range)
} }
/// Used for SIMD. /// Used for SIMD.
@ -595,12 +594,12 @@ impl<'a> GlyphStore {
unsafe { mem::transmute(self.entry_buffer.as_slice()) } unsafe { mem::transmute(self.entry_buffer.as_slice()) }
} }
pub fn char_is_space(&self, i: CharIndex) -> bool { pub fn char_is_space(&self, i: ByteIndex) -> bool {
assert!(i < self.char_len()); assert!(i < self.len());
self.entry_buffer[i.to_usize()].char_is_space() self.entry_buffer[i.to_usize()].char_is_space()
} }
pub fn space_count_in_range(&self, range: &Range<CharIndex>) -> u32 { pub fn space_count_in_range(&self, range: &Range<ByteIndex>) -> u32 {
let mut spaces = 0; let mut spaces = 0;
for index in range.each_index() { for index in range.each_index() {
if self.char_is_space(index) { if self.char_is_space(index) {
@ -610,7 +609,7 @@ impl<'a> GlyphStore {
spaces spaces
} }
pub fn distribute_extra_space_in_range(&mut self, range: &Range<CharIndex>, space: f64) { pub fn distribute_extra_space_in_range(&mut self, range: &Range<ByteIndex>, space: f64) {
debug_assert!(space >= 0.0); debug_assert!(space >= 0.0);
if range.is_empty() { if range.is_empty() {
return return
@ -659,12 +658,12 @@ impl fmt::Debug for GlyphStore {
} }
} }
/// An iterator over the glyphs in a character range in a `GlyphStore`. /// An iterator over the glyphs in a byte range in a `GlyphStore`.
pub struct GlyphIterator<'a> { pub struct GlyphIterator<'a> {
store: &'a GlyphStore, store: &'a GlyphStore,
char_index: CharIndex, byte_index: ByteIndex,
char_range: Range<CharIndex>, byte_range: Range<ByteIndex>,
glyph_range: Option<EachIndex<isize, CharIndex>>, glyph_range: Option<EachIndex<isize, ByteIndex>>,
} }
impl<'a> GlyphIterator<'a> { impl<'a> GlyphIterator<'a> {
@ -673,7 +672,7 @@ impl<'a> GlyphIterator<'a> {
fn next_glyph_range(&mut self) -> Option<GlyphInfo<'a>> { fn next_glyph_range(&mut self) -> Option<GlyphInfo<'a>> {
match self.glyph_range.as_mut().unwrap().next() { match self.glyph_range.as_mut().unwrap().next() {
Some(j) => { Some(j) => {
Some(GlyphInfo::Detail(self.store, self.char_index, j.get() as u16 /* ??? */)) Some(GlyphInfo::Detail(self.store, self.byte_index, j.get() as u16 /* ??? */))
} }
None => { None => {
// No more glyphs for current character. Try to get another. // No more glyphs for current character. Try to get another.
@ -685,9 +684,9 @@ impl<'a> GlyphIterator<'a> {
// Slow path when there is a complex glyph. // Slow path when there is a complex glyph.
#[inline(never)] #[inline(never)]
fn next_complex_glyph(&mut self, entry: &GlyphEntry, i: CharIndex) -> Option<GlyphInfo<'a>> { fn next_complex_glyph(&mut self, entry: &GlyphEntry, i: ByteIndex) -> Option<GlyphInfo<'a>> {
let glyphs = self.store.detail_store.detailed_glyphs_for_entry(i, entry.glyph_count()); let glyphs = self.store.detail_store.detailed_glyphs_for_entry(i, entry.glyph_count());
self.glyph_range = Some(range::each_index(CharIndex(0), CharIndex(glyphs.len() as isize))); self.glyph_range = Some(range::each_index(ByteIndex(0), ByteIndex(glyphs.len() as isize)));
self.next() self.next()
} }
} }
@ -708,17 +707,17 @@ impl<'a> Iterator for GlyphIterator<'a> {
return self.next_glyph_range() return self.next_glyph_range()
} }
// No glyph range. Look at next character. // No glyph range. Look at next byte.
self.char_index = self.char_index + if self.store.is_rtl { self.byte_index = self.byte_index + if self.store.is_rtl {
CharIndex(-1) ByteIndex(-1)
} else { } else {
CharIndex(1) ByteIndex(1)
}; };
let i = self.char_index; let i = self.byte_index;
if !self.char_range.contains(i) { if !self.byte_range.contains(i) {
return None return None
} }
debug_assert!(i < self.store.char_len()); debug_assert!(i < self.store.len());
let entry = self.store.entry_buffer[i.to_usize()]; let entry = self.store.entry_buffer[i.to_usize()];
if entry.is_simple() { if entry.is_simple() {
Some(GlyphInfo::Simple(self.store, i)) Some(GlyphInfo::Simple(self.store, i))

View file

@ -35,7 +35,7 @@ use harfbuzz::{hb_position_t, hb_tag_t};
use libc::{c_char, c_int, c_uint, c_void}; use libc::{c_char, c_int, c_uint, c_void};
use platform::font::FontTable; use platform::font::FontTable;
use std::{char, cmp, ptr}; use std::{char, cmp, ptr};
use text::glyph::{CharIndex, GlyphData, GlyphId, GlyphStore}; use text::glyph::{ByteIndex, GlyphData, GlyphId, GlyphStore};
use text::shaping::ShaperMethods; use text::shaping::ShaperMethods;
use text::util::{fixed_to_float, float_to_fixed, is_bidi_control}; use text::util::{fixed_to_float, float_to_fixed, is_bidi_control};
@ -45,8 +45,7 @@ macro_rules! hb_tag {
); );
} }
static NO_GLYPH: i32 = -1; const NO_GLYPH: i32 = -1;
static CONTINUATION_BYTE: i32 = -2;
static KERN: u32 = hb_tag!('k', 'e', 'r', 'n'); static KERN: u32 = hb_tag!('k', 'e', 'r', 'n');
static LIGA: u32 = hb_tag!('l', 'i', 'g', 'a'); static LIGA: u32 = hb_tag!('l', 'i', 'g', 'a');
@ -258,44 +257,18 @@ impl Shaper {
let glyph_data = ShapedGlyphData::new(buffer); let glyph_data = ShapedGlyphData::new(buffer);
let glyph_count = glyph_data.len(); let glyph_count = glyph_data.len();
let byte_max = text.len(); let byte_max = text.len();
let char_max = text.chars().count();
// GlyphStore records are indexed by character, not byte offset. debug!("Shaped text[byte count={}], got back {} glyph info records.",
// so, we must be careful to increment this when saving glyph entries. byte_max,
let (mut char_idx, char_step) = if options.flags.contains(RTL_FLAG) {
(CharIndex(char_max as isize - 1), CharIndex(-1))
} else {
(CharIndex(0), CharIndex(1))
};
debug!("Shaped text[char count={}], got back {} glyph info records.",
char_max,
glyph_count); glyph_count);
if char_max != glyph_count {
debug!("NOTE: Since these are not equal, we probably have been given some complex \
glyphs.");
}
// make map of what chars have glyphs // make map of what chars have glyphs
let mut byte_to_glyph: Vec<i32>; let mut byte_to_glyph = vec![NO_GLYPH; byte_max];
// fast path: all chars are single-byte.
if byte_max == char_max {
byte_to_glyph = vec![NO_GLYPH; byte_max];
} else {
byte_to_glyph = vec![CONTINUATION_BYTE; byte_max];
for (i, _) in text.char_indices() {
byte_to_glyph[i] = NO_GLYPH;
}
}
debug!("(glyph idx) -> (text byte offset)"); debug!("(glyph idx) -> (text byte offset)");
for i in 0..glyph_data.len() { for i in 0..glyph_data.len() {
// loc refers to a *byte* offset within the utf8 string.
let loc = glyph_data.byte_offset_of_glyph(i) as usize; let loc = glyph_data.byte_offset_of_glyph(i) as usize;
if loc < byte_max { if loc < byte_max {
assert!(byte_to_glyph[loc] != CONTINUATION_BYTE);
byte_to_glyph[loc] = i as i32; byte_to_glyph[loc] = i as i32;
} else { } else {
debug!("ERROR: tried to set out of range byte_to_glyph: idx={}, glyph idx={}", debug!("ERROR: tried to set out of range byte_to_glyph: idx={}, glyph idx={}",
@ -312,10 +285,7 @@ impl Shaper {
} }
let mut glyph_span = 0..0; let mut glyph_span = 0..0;
let mut byte_range = 0..0;
// This span contains first byte of first char, to last byte of last char in range.
// So, char_byte_span.end points to first byte of last+1 char, if it's less than byte_max.
let mut char_byte_span;
let mut y_pos = Au(0); let mut y_pos = Au(0);
@ -325,106 +295,62 @@ impl Shaper {
while glyph_span.start < glyph_count { while glyph_span.start < glyph_count {
debug!("Processing glyph at idx={}", glyph_span.start); debug!("Processing glyph at idx={}", glyph_span.start);
glyph_span.end = glyph_span.start; glyph_span.end = glyph_span.start;
byte_range.end = glyph_data.byte_offset_of_glyph(glyph_span.start) as usize;
let char_byte_start = glyph_data.byte_offset_of_glyph(glyph_span.start) as usize; while byte_range.end < byte_max {
char_byte_span = char_byte_start..char_byte_start; byte_range.end += 1;
let mut glyph_spans_multiple_characters = false; // Extend the byte range to include any following byte without its own glyph.
while byte_range.end < byte_max && byte_to_glyph[byte_range.end] == NO_GLYPH {
// find a range of chars corresponding to this glyph, plus byte_range.end += 1;
// any trailing chars that do not have associated glyphs.
while char_byte_span.end < byte_max {
let ch = text[char_byte_span.end..].chars().next().unwrap();
char_byte_span.end += ch.len_utf8();
debug!("Processing char byte span: off={}, len={} for glyph idx={}",
char_byte_span.start, char_byte_span.len(), glyph_span.start);
while char_byte_span.end != byte_max &&
byte_to_glyph[char_byte_span.end] == NO_GLYPH {
debug!("Extending char byte span to include byte offset={} with no associated \
glyph", char_byte_span.end);
let ch = text[char_byte_span.end..].chars().next().unwrap();
char_byte_span.end += ch.len_utf8();
glyph_spans_multiple_characters = true;
} }
// extend glyph range to max glyph index covered by char_span, // Extend the glyph range to include all glyphs covered by bytes processed so far.
// in cases where one char made several glyphs and left some unassociated chars.
let mut max_glyph_idx = glyph_span.end; let mut max_glyph_idx = glyph_span.end;
for i in char_byte_span.clone() { for glyph_idx in &byte_to_glyph[byte_range.clone()] {
if byte_to_glyph[i] > NO_GLYPH { if *glyph_idx != NO_GLYPH {
max_glyph_idx = cmp::max(byte_to_glyph[i] as usize + 1, max_glyph_idx); max_glyph_idx = cmp::max(*glyph_idx as usize + 1, max_glyph_idx);
} }
} }
if max_glyph_idx > glyph_span.end { if max_glyph_idx > glyph_span.end {
glyph_span.end = max_glyph_idx; glyph_span.end = max_glyph_idx;
debug!("Extended glyph span (off={}, len={}) to cover char byte span's max \ debug!("Extended glyph span to {:?}", glyph_span);
glyph index",
glyph_span.start, glyph_span.len());
} }
// if there's just one glyph, then we don't need further checks. // if there's just one glyph, then we don't need further checks.
if glyph_span.len() == 1 { break; } if glyph_span.len() == 1 { break; }
// if no glyphs were found yet, extend the char byte range more. // if no glyphs were found yet, extend the char byte range more.
if glyph_span.len() == 0 { continue; } if glyph_span.len() == 0 { continue; }
debug!("Complex (multi-glyph to multi-char) association found. This case \ // If byte_range now includes all the byte offsets found in glyph_span, then we
probably doesn't work."); // have found a contiguous "cluster" and can stop extending it.
let mut all_glyphs_are_within_cluster: bool = true; let mut all_glyphs_are_within_cluster: bool = true;
for j in glyph_span.clone() { for j in glyph_span.clone() {
let loc = glyph_data.byte_offset_of_glyph(j); let loc = glyph_data.byte_offset_of_glyph(j);
if !char_byte_span.contains(loc as usize) { if !byte_range.contains(loc as usize) {
all_glyphs_are_within_cluster = false; all_glyphs_are_within_cluster = false;
break break
} }
} }
debug!("All glyphs within char_byte_span cluster?: {}",
all_glyphs_are_within_cluster);
// found a valid range; stop extending char_span.
if all_glyphs_are_within_cluster { if all_glyphs_are_within_cluster {
break break
} }
// Otherwise, the bytes we have seen so far correspond to a non-contiguous set of
// glyphs. Keep extending byte_range until we fill in all the holes in the glyph
// span or reach the end of the text.
} }
// character/glyph clump must contain characters. assert!(byte_range.len() > 0);
assert!(char_byte_span.len() > 0);
// character/glyph clump must contain glyphs.
assert!(glyph_span.len() > 0); assert!(glyph_span.len() > 0);
// now char_span is a ligature clump, formed by the glyphs in glyph_span. // Now byte_range is the ligature clump formed by the glyphs in glyph_span.
// we need to find the chars that correspond to actual glyphs (char_extended_span), // We will save these glyphs to the glyph store at the index of the first byte.
//and set glyph info for those and empty infos for the chars that are continuations. let byte_idx = ByteIndex(byte_range.start as isize);
// a simple example: if glyph_span.len() == 1 {
// chars: 'f' 't' 't' // Fast path: 1-to-1 mapping of byte offset to single glyph.
// glyphs: 'ftt' '' '' //
// cgmap: t f f
// gspan: [-]
// cspan: [-]
// covsp: [---------------]
let mut covered_byte_span = char_byte_span.clone();
// extend, clipping at end of text range.
while covered_byte_span.end < byte_max &&
byte_to_glyph[covered_byte_span.end] == NO_GLYPH {
let ch = text[covered_byte_span.end..].chars().next().unwrap();
covered_byte_span.end += ch.len_utf8();
}
if covered_byte_span.start >= byte_max {
// oops, out of range. clip and forget this clump.
glyph_span.start = glyph_span.end;
char_byte_span.start = char_byte_span.end;
}
// fast path: 1-to-1 mapping of single char and single glyph.
if glyph_span.len() == 1 && !glyph_spans_multiple_characters {
// TODO(Issue #214): cluster ranges need to be computed before // TODO(Issue #214): cluster ranges need to be computed before
// shaping, and then consulted here. // shaping, and then consulted here.
// for now, just pretend that every character is a cluster start. // for now, just pretend that every character is a cluster start.
@ -433,7 +359,7 @@ impl Shaper {
// //
// NB: When we acquire the ability to handle ligatures that cross word boundaries, // NB: When we acquire the ability to handle ligatures that cross word boundaries,
// we'll need to do something special to handle `word-spacing` properly. // we'll need to do something special to handle `word-spacing` properly.
let character = text[char_byte_span.clone()].chars().next().unwrap(); let character = text[byte_range.clone()].chars().next().unwrap();
if is_bidi_control(character) { if is_bidi_control(character) {
// Don't add any glyphs for bidi control chars // Don't add any glyphs for bidi control chars
} else if character == '\t' { } else if character == '\t' {
@ -449,7 +375,7 @@ impl Shaper {
Default::default(), Default::default(),
true, true,
true); true);
glyphs.add_glyph_for_char_index(char_idx, character, &data); glyphs.add_glyph_for_byte_index(byte_idx, character, &data);
} else { } else {
let shape = glyph_data.entry_for_glyph(glyph_span.start, &mut y_pos); let shape = glyph_data.entry_for_glyph(glyph_span.start, &mut y_pos);
let advance = self.advance_for_shaped_glyph(shape.advance, character, options); let advance = self.advance_for_shaped_glyph(shape.advance, character, options);
@ -458,7 +384,7 @@ impl Shaper {
shape.offset, shape.offset,
true, true,
true); true);
glyphs.add_glyph_for_char_index(char_idx, character, &data); glyphs.add_glyph_for_byte_index(byte_idx, character, &data);
} }
} else { } else {
// collect all glyphs to be assigned to the first character. // collect all glyphs to be assigned to the first character.
@ -473,15 +399,12 @@ impl Shaper {
glyph_i > glyph_span.start)); glyph_i > glyph_span.start));
// all but first are ligature continuations // all but first are ligature continuations
} }
// now add the detailed glyph entry. // now add the detailed glyph entry.
glyphs.add_glyphs_for_char_index(char_idx, &datas); glyphs.add_glyphs_for_byte_index(byte_idx, &datas);
} }
// shift up our working spans past things we just handled.
glyph_span.start = glyph_span.end; glyph_span.start = glyph_span.end;
char_byte_span.start = char_byte_span.end; byte_range.start = byte_range.end;
char_idx = char_idx + char_step;
} }
// this must be called after adding all glyph data; it sorts the // this must be called after adding all glyph data; it sorts the

View file

@ -11,11 +11,11 @@ use std::cell::Cell;
use std::cmp::{Ordering, max}; use std::cmp::{Ordering, max};
use std::slice::Iter; use std::slice::Iter;
use std::sync::Arc; use std::sync::Arc;
use text::glyph::{CharIndex, GlyphStore}; use text::glyph::{ByteIndex, GlyphStore};
use webrender_traits; use webrender_traits;
thread_local! { thread_local! {
static INDEX_OF_FIRST_GLYPH_RUN_CACHE: Cell<Option<(*const TextRun, CharIndex, usize)>> = static INDEX_OF_FIRST_GLYPH_RUN_CACHE: Cell<Option<(*const TextRun, ByteIndex, usize)>> =
Cell::new(None) Cell::new(None)
} }
@ -51,19 +51,19 @@ impl Drop for TextRun {
pub struct GlyphRun { pub struct GlyphRun {
/// The glyphs. /// The glyphs.
pub glyph_store: Arc<GlyphStore>, pub glyph_store: Arc<GlyphStore>,
/// The range of characters in the containing run. /// The byte range of characters in the containing run.
pub range: Range<CharIndex>, pub range: Range<ByteIndex>,
} }
pub struct NaturalWordSliceIterator<'a> { pub struct NaturalWordSliceIterator<'a> {
glyphs: &'a [GlyphRun], glyphs: &'a [GlyphRun],
index: usize, index: usize,
range: Range<CharIndex>, range: Range<ByteIndex>,
reverse: bool, reverse: bool,
} }
impl GlyphRun { impl GlyphRun {
fn compare(&self, key: &CharIndex) -> Ordering { fn compare(&self, key: &ByteIndex) -> Ordering {
if *key < self.range.begin() { if *key < self.range.begin() {
Ordering::Greater Ordering::Greater
} else if *key >= self.range.end() { } else if *key >= self.range.end() {
@ -79,16 +79,16 @@ impl GlyphRun {
pub struct TextRunSlice<'a> { pub struct TextRunSlice<'a> {
/// The glyph store that the glyphs in this slice belong to. /// The glyph store that the glyphs in this slice belong to.
pub glyphs: &'a GlyphStore, pub glyphs: &'a GlyphStore,
/// The character index that this slice begins at, relative to the start of the *text run*. /// The byte index that this slice begins at, relative to the start of the *text run*.
pub offset: CharIndex, pub offset: ByteIndex,
/// The range that these glyphs encompass, relative to the start of the *glyph store*. /// The range that these glyphs encompass, relative to the start of the *glyph store*.
pub range: Range<CharIndex>, pub range: Range<ByteIndex>,
} }
impl<'a> TextRunSlice<'a> { impl<'a> TextRunSlice<'a> {
/// Returns the range that these glyphs encompass, relative to the start of the *text run*. /// Returns the range that these glyphs encompass, relative to the start of the *text run*.
#[inline] #[inline]
pub fn text_run_range(&self) -> Range<CharIndex> { pub fn text_run_range(&self) -> Range<ByteIndex> {
let mut range = self.range; let mut range = self.range;
range.shift_by(self.offset); range.shift_by(self.offset);
range range
@ -116,15 +116,15 @@ impl<'a> Iterator for NaturalWordSliceIterator<'a> {
self.index += 1; self.index += 1;
} }
let mut char_range = self.range.intersect(&slice_glyphs.range); let mut byte_range = self.range.intersect(&slice_glyphs.range);
let slice_range_begin = slice_glyphs.range.begin(); let slice_range_begin = slice_glyphs.range.begin();
char_range.shift_by(-slice_range_begin); byte_range.shift_by(-slice_range_begin);
if !char_range.is_empty() { if !byte_range.is_empty() {
Some(TextRunSlice { Some(TextRunSlice {
glyphs: &*slice_glyphs.glyph_store, glyphs: &*slice_glyphs.glyph_store,
offset: slice_range_begin, offset: slice_range_begin,
range: char_range, range: byte_range,
}) })
} else { } else {
None None
@ -133,9 +133,10 @@ impl<'a> Iterator for NaturalWordSliceIterator<'a> {
} }
pub struct CharacterSliceIterator<'a> { pub struct CharacterSliceIterator<'a> {
text: &'a str,
glyph_run: Option<&'a GlyphRun>, glyph_run: Option<&'a GlyphRun>,
glyph_run_iter: Iter<'a, GlyphRun>, glyph_run_iter: Iter<'a, GlyphRun>,
range: Range<CharIndex>, range: Range<ByteIndex>,
} }
impl<'a> Iterator for CharacterSliceIterator<'a> { impl<'a> Iterator for CharacterSliceIterator<'a> {
@ -150,8 +151,13 @@ impl<'a> Iterator for CharacterSliceIterator<'a> {
}; };
debug_assert!(!self.range.is_empty()); debug_assert!(!self.range.is_empty());
let index_to_return = self.range.begin(); let byte_start = self.range.begin();
self.range.adjust_by(CharIndex(1), CharIndex(-1)); let byte_len = match self.text[byte_start.to_usize()..].chars().next() {
Some(ch) => ByteIndex(ch.len_utf8() as isize),
None => unreachable!() // XXX refactor?
};
self.range.adjust_by(byte_len, -byte_len);
if self.range.is_empty() { if self.range.is_empty() {
// We're done. // We're done.
self.glyph_run = None self.glyph_run = None
@ -160,11 +166,11 @@ impl<'a> Iterator for CharacterSliceIterator<'a> {
self.glyph_run = self.glyph_run_iter.next(); self.glyph_run = self.glyph_run_iter.next();
} }
let index_within_glyph_run = index_to_return - glyph_run.range.begin(); let index_within_glyph_run = byte_start - glyph_run.range.begin();
Some(TextRunSlice { Some(TextRunSlice {
glyphs: &*glyph_run.glyph_store, glyphs: &*glyph_run.glyph_store,
offset: glyph_run.range.begin(), offset: glyph_run.range.begin(),
range: Range::new(index_within_glyph_run, CharIndex(1)), range: Range::new(index_within_glyph_run, byte_len),
}) })
} }
} }
@ -187,9 +193,9 @@ impl<'a> TextRun {
-> Vec<GlyphRun> { -> Vec<GlyphRun> {
// TODO(Issue #230): do a better job. See Gecko's LineBreaker. // TODO(Issue #230): do a better job. See Gecko's LineBreaker.
let mut glyphs = vec!(); let mut glyphs = vec!();
let (mut byte_i, mut char_i) = (0, CharIndex(0)); let mut byte_i = 0;
let mut cur_slice_is_whitespace = false; let mut cur_slice_is_whitespace = false;
let (mut byte_last_boundary, mut char_last_boundary) = (0, CharIndex(0)); let mut byte_last_boundary = 0;
for ch in text.chars() { for ch in text.chars() {
// Slices alternate between whitespace and non-whitespace, // Slices alternate between whitespace and non-whitespace,
@ -225,14 +231,13 @@ impl<'a> TextRun {
glyphs.push(GlyphRun { glyphs.push(GlyphRun {
glyph_store: font.shape_text(slice, &options), glyph_store: font.shape_text(slice, &options),
range: Range::new(char_last_boundary, char_i - char_last_boundary), range: Range::new(ByteIndex(byte_last_boundary as isize),
ByteIndex((byte_i - byte_last_boundary) as isize)),
}); });
byte_last_boundary = byte_i; byte_last_boundary = byte_i;
char_last_boundary = char_i;
} }
byte_i = byte_i + ch.len_utf8(); byte_i = byte_i + ch.len_utf8();
char_i = char_i + CharIndex(1);
} }
// Create a glyph store for the final slice if it's nonempty. // Create a glyph store for the final slice if it's nonempty.
@ -248,7 +253,8 @@ impl<'a> TextRun {
glyphs.push(GlyphRun { glyphs.push(GlyphRun {
glyph_store: font.shape_text(slice, &options), glyph_store: font.shape_text(slice, &options),
range: Range::new(char_last_boundary, char_i - char_last_boundary), range: Range::new(ByteIndex(byte_last_boundary as isize),
ByteIndex((byte_i - byte_last_boundary) as isize)),
}); });
} }
@ -263,7 +269,7 @@ impl<'a> TextRun {
self.font_metrics.descent self.font_metrics.descent
} }
pub fn advance_for_range(&self, range: &Range<CharIndex>) -> Au { pub fn advance_for_range(&self, range: &Range<ByteIndex>) -> Au {
if range.is_empty() { if range.is_empty() {
return Au(0) return Au(0)
} }
@ -272,24 +278,24 @@ impl<'a> TextRun {
// TODO(Issue #98): using inter-char and inter-word spacing settings when measuring text // TODO(Issue #98): using inter-char and inter-word spacing settings when measuring text
self.natural_word_slices_in_range(range) self.natural_word_slices_in_range(range)
.fold(Au(0), |advance, slice| { .fold(Au(0), |advance, slice| {
advance + slice.glyphs.advance_for_char_range(&slice.range) advance + slice.glyphs.advance_for_byte_range(&slice.range)
}) })
} }
pub fn metrics_for_range(&self, range: &Range<CharIndex>) -> RunMetrics { pub fn metrics_for_range(&self, range: &Range<ByteIndex>) -> RunMetrics {
RunMetrics::new(self.advance_for_range(range), RunMetrics::new(self.advance_for_range(range),
self.font_metrics.ascent, self.font_metrics.ascent,
self.font_metrics.descent) self.font_metrics.descent)
} }
pub fn metrics_for_slice(&self, glyphs: &GlyphStore, slice_range: &Range<CharIndex>) pub fn metrics_for_slice(&self, glyphs: &GlyphStore, slice_range: &Range<ByteIndex>)
-> RunMetrics { -> RunMetrics {
RunMetrics::new(glyphs.advance_for_char_range(slice_range), RunMetrics::new(glyphs.advance_for_byte_range(slice_range),
self.font_metrics.ascent, self.font_metrics.ascent,
self.font_metrics.descent) self.font_metrics.descent)
} }
pub fn min_width_for_range(&self, range: &Range<CharIndex>) -> Au { pub fn min_width_for_range(&self, range: &Range<ByteIndex>) -> Au {
debug!("iterating outer range {:?}", range); debug!("iterating outer range {:?}", range);
self.natural_word_slices_in_range(range).fold(Au(0), |max_piece_width, slice| { self.natural_word_slices_in_range(range).fold(Au(0), |max_piece_width, slice| {
debug!("iterated on {:?}[{:?}]", slice.offset, slice.range); debug!("iterated on {:?}[{:?}]", slice.offset, slice.range);
@ -297,8 +303,8 @@ impl<'a> TextRun {
}) })
} }
/// Returns the index of the first glyph run containing the given character index. /// Returns the index of the first glyph run containing the given byte index.
fn index_of_first_glyph_run_containing(&self, index: CharIndex) -> Option<usize> { fn index_of_first_glyph_run_containing(&self, index: ByteIndex) -> Option<usize> {
let self_ptr = self as *const TextRun; let self_ptr = self as *const TextRun;
INDEX_OF_FIRST_GLYPH_RUN_CACHE.with(|index_of_first_glyph_run_cache| { INDEX_OF_FIRST_GLYPH_RUN_CACHE.with(|index_of_first_glyph_run_cache| {
if let Some((last_text_run, last_index, last_result)) = if let Some((last_text_run, last_index, last_result)) =
@ -319,7 +325,7 @@ impl<'a> TextRun {
/// Returns an iterator that will iterate over all slices of glyphs that represent natural /// Returns an iterator that will iterate over all slices of glyphs that represent natural
/// words in the given range. /// words in the given range.
pub fn natural_word_slices_in_range(&'a self, range: &Range<CharIndex>) pub fn natural_word_slices_in_range(&'a self, range: &Range<ByteIndex>)
-> NaturalWordSliceIterator<'a> { -> NaturalWordSliceIterator<'a> {
let index = match self.index_of_first_glyph_run_containing(range.begin()) { let index = match self.index_of_first_glyph_run_containing(range.begin()) {
None => self.glyphs.len(), None => self.glyphs.len(),
@ -335,13 +341,13 @@ impl<'a> TextRun {
/// Returns an iterator that over natural word slices in visual order (left to right or /// Returns an iterator that over natural word slices in visual order (left to right or
/// right to left, depending on the bidirectional embedding level). /// right to left, depending on the bidirectional embedding level).
pub fn natural_word_slices_in_visual_order(&'a self, range: &Range<CharIndex>) pub fn natural_word_slices_in_visual_order(&'a self, range: &Range<ByteIndex>)
-> NaturalWordSliceIterator<'a> { -> NaturalWordSliceIterator<'a> {
// Iterate in reverse order if bidi level is RTL. // Iterate in reverse order if bidi level is RTL.
let reverse = self.bidi_level % 2 == 1; let reverse = self.bidi_level % 2 == 1;
let index = if reverse { let index = if reverse {
match self.index_of_first_glyph_run_containing(range.end() - CharIndex(1)) { match self.index_of_first_glyph_run_containing(range.end() - ByteIndex(1)) {
Some(i) => i + 1, // In reverse mode, index points one past the next element. Some(i) => i + 1, // In reverse mode, index points one past the next element.
None => 0 None => 0
} }
@ -361,7 +367,7 @@ impl<'a> TextRun {
/// Returns an iterator that will iterate over all slices of glyphs that represent individual /// Returns an iterator that will iterate over all slices of glyphs that represent individual
/// characters in the given range. /// characters in the given range.
pub fn character_slices_in_range(&'a self, range: &Range<CharIndex>) pub fn character_slices_in_range(&'a self, range: &Range<ByteIndex>)
-> CharacterSliceIterator<'a> { -> CharacterSliceIterator<'a> {
let index = match self.index_of_first_glyph_run_containing(range.begin()) { let index = match self.index_of_first_glyph_run_containing(range.begin()) {
None => self.glyphs.len(), None => self.glyphs.len(),
@ -370,6 +376,7 @@ impl<'a> TextRun {
let mut glyph_run_iter = self.glyphs[index..].iter(); let mut glyph_run_iter = self.glyphs[index..].iter();
let first_glyph_run = glyph_run_iter.next(); let first_glyph_run = glyph_run_iter.next();
CharacterSliceIterator { CharacterSliceIterator {
text: &self.text,
glyph_run: first_glyph_run, glyph_run: first_glyph_run,
glyph_run_iter: glyph_run_iter, glyph_run_iter: glyph_run_iter,
range: *range, range: *range,

View file

@ -31,7 +31,7 @@ use gfx::display_list::{LineDisplayItem, OpaqueNode, SolidColorDisplayItem};
use gfx::display_list::{StackingContext, StackingContextId, StackingContextType}; use gfx::display_list::{StackingContext, StackingContextId, StackingContextType};
use gfx::display_list::{TextDisplayItem, TextOrientation, WebRenderImageInfo}; use gfx::display_list::{TextDisplayItem, TextOrientation, WebRenderImageInfo};
use gfx::paint_thread::THREAD_TINT_COLORS; use gfx::paint_thread::THREAD_TINT_COLORS;
use gfx::text::glyph::CharIndex; use gfx::text::glyph::ByteIndex;
use gfx_traits::{color, ScrollPolicy}; use gfx_traits::{color, ScrollPolicy};
use inline::{FIRST_FRAGMENT_OF_ELEMENT, InlineFlow, LAST_FRAGMENT_OF_ELEMENT}; use inline::{FIRST_FRAGMENT_OF_ELEMENT, InlineFlow, LAST_FRAGMENT_OF_ELEMENT};
use ipc_channel::ipc::{self, IpcSharedMemory}; use ipc_channel::ipc::{self, IpcSharedMemory};
@ -965,7 +965,7 @@ impl FragmentDisplayListBuilding for Fragment {
Some(insertion_point_index) => insertion_point_index, Some(insertion_point_index) => insertion_point_index,
None => return, None => return,
}; };
let range = Range::new(CharIndex(0), insertion_point_index); let range = Range::new(ByteIndex(0), insertion_point_index);
let advance = scanned_text_fragment_info.run.advance_for_range(&range); let advance = scanned_text_fragment_info.run.advance_for_range(&range);
let insertion_point_bounds; let insertion_point_bounds;

View file

@ -15,7 +15,7 @@ use flow::{self, Flow};
use flow_ref::{self, FlowRef}; use flow_ref::{self, FlowRef};
use gfx; use gfx;
use gfx::display_list::{BLUR_INFLATION_FACTOR, FragmentType, OpaqueNode, StackingContextId}; use gfx::display_list::{BLUR_INFLATION_FACTOR, FragmentType, OpaqueNode, StackingContextId};
use gfx::text::glyph::CharIndex; use gfx::text::glyph::ByteIndex;
use gfx::text::text_run::{TextRun, TextRunSlice}; use gfx::text::text_run::{TextRun, TextRunSlice};
use gfx_traits::{LayerId, LayerType}; use gfx_traits::{LayerId, LayerType};
use incremental::{RECONSTRUCT_FLOW, RestyleDamage}; use incremental::{RECONSTRUCT_FLOW, RestyleDamage};
@ -48,7 +48,6 @@ use text;
use text::TextRunScanner; use text::TextRunScanner;
use url::Url; use url::Url;
use util; use util;
use util::str::slice_chars;
use wrapper::{PseudoElementType, ThreadSafeLayoutElement, ThreadSafeLayoutNode}; use wrapper::{PseudoElementType, ThreadSafeLayoutElement, ThreadSafeLayoutNode};
/// Fragments (`struct Fragment`) are the leaves of the layout tree. They cannot position /// Fragments (`struct Fragment`) are the leaves of the layout tree. They cannot position
@ -227,13 +226,8 @@ impl SpecificFragmentInfo {
impl fmt::Debug for SpecificFragmentInfo { impl fmt::Debug for SpecificFragmentInfo {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
match *self { match *self {
SpecificFragmentInfo::ScannedText(ref info) => { SpecificFragmentInfo::ScannedText(ref info) => write!(f, "{:?}", info.text()),
write!(f, "{:?}", slice_chars(&*info.run.text, info.range.begin().get() as usize, SpecificFragmentInfo::UnscannedText(ref info) => write!(f, "{:?}", info.text),
info.range.end().get() as usize))
}
SpecificFragmentInfo::UnscannedText(ref info) => {
write!(f, "{:?}", info.text)
}
_ => Ok(()) _ => Ok(())
} }
} }
@ -657,16 +651,16 @@ pub struct ScannedTextFragmentInfo {
/// The intrinsic size of the text fragment. /// The intrinsic size of the text fragment.
pub content_size: LogicalSize<Au>, pub content_size: LogicalSize<Au>,
/// The position of the insertion point in characters, if any. /// The byte offset of the insertion point, if any.
pub insertion_point: Option<CharIndex>, pub insertion_point: Option<ByteIndex>,
/// The range within the above text run that this represents. /// The range within the above text run that this represents.
pub range: Range<CharIndex>, pub range: Range<ByteIndex>,
/// The endpoint of the above range, including whitespace that was stripped out. This exists /// The endpoint of the above range, including whitespace that was stripped out. This exists
/// so that we can restore the range to its original value (before line breaking occurred) when /// so that we can restore the range to its original value (before line breaking occurred) when
/// performing incremental reflow. /// performing incremental reflow.
pub range_end_including_stripped_whitespace: CharIndex, pub range_end_including_stripped_whitespace: ByteIndex,
pub flags: ScannedTextFlags, pub flags: ScannedTextFlags,
} }
@ -685,9 +679,9 @@ bitflags! {
impl ScannedTextFragmentInfo { impl ScannedTextFragmentInfo {
/// Creates the information specific to a scanned text fragment from a range and a text run. /// Creates the information specific to a scanned text fragment from a range and a text run.
pub fn new(run: Arc<TextRun>, pub fn new(run: Arc<TextRun>,
range: Range<CharIndex>, range: Range<ByteIndex>,
content_size: LogicalSize<Au>, content_size: LogicalSize<Au>,
insertion_point: Option<CharIndex>, insertion_point: Option<ByteIndex>,
flags: ScannedTextFlags) flags: ScannedTextFlags)
-> ScannedTextFragmentInfo { -> ScannedTextFragmentInfo {
ScannedTextFragmentInfo { ScannedTextFragmentInfo {
@ -700,6 +694,10 @@ impl ScannedTextFragmentInfo {
} }
} }
pub fn text(&self) -> &str {
&self.run.text[self.range.begin().to_usize() .. self.range.end().to_usize()]
}
pub fn requires_line_break_afterward_if_wrapping_on_newlines(&self) -> bool { pub fn requires_line_break_afterward_if_wrapping_on_newlines(&self) -> bool {
self.flags.contains(REQUIRES_LINE_BREAK_AFTERWARD_IF_WRAPPING_ON_NEWLINES) self.flags.contains(REQUIRES_LINE_BREAK_AFTERWARD_IF_WRAPPING_ON_NEWLINES)
} }
@ -715,12 +713,12 @@ impl ScannedTextFragmentInfo {
pub struct SplitInfo { pub struct SplitInfo {
// TODO(bjz): this should only need to be a single character index, but both values are // TODO(bjz): this should only need to be a single character index, but both values are
// currently needed for splitting in the `inline::try_append_*` functions. // currently needed for splitting in the `inline::try_append_*` functions.
pub range: Range<CharIndex>, pub range: Range<ByteIndex>,
pub inline_size: Au, pub inline_size: Au,
} }
impl SplitInfo { impl SplitInfo {
fn new(range: Range<CharIndex>, info: &ScannedTextFragmentInfo) -> SplitInfo { fn new(range: Range<ByteIndex>, info: &ScannedTextFragmentInfo) -> SplitInfo {
let inline_size = info.run.advance_for_range(&range); let inline_size = info.run.advance_for_range(&range);
SplitInfo { SplitInfo {
range: range, range: range,
@ -755,13 +753,13 @@ pub struct UnscannedTextFragmentInfo {
pub text: Box<str>, pub text: Box<str>,
/// The selected text range. An empty range represents the insertion point. /// The selected text range. An empty range represents the insertion point.
pub selection: Option<Range<CharIndex>>, pub selection: Option<Range<ByteIndex>>,
} }
impl UnscannedTextFragmentInfo { impl UnscannedTextFragmentInfo {
/// Creates a new instance of `UnscannedTextFragmentInfo` from the given text. /// Creates a new instance of `UnscannedTextFragmentInfo` from the given text.
#[inline] #[inline]
pub fn new(text: String, selection: Option<Range<CharIndex>>) -> UnscannedTextFragmentInfo { pub fn new(text: String, selection: Option<Range<ByteIndex>>) -> UnscannedTextFragmentInfo {
UnscannedTextFragmentInfo { UnscannedTextFragmentInfo {
text: text.into_boxed_str(), text: text.into_boxed_str(),
selection: selection, selection: selection,
@ -1611,7 +1609,7 @@ impl Fragment {
}; };
let mut remaining_inline_size = max_inline_size; let mut remaining_inline_size = max_inline_size;
let mut inline_start_range = Range::new(text_fragment_info.range.begin(), CharIndex(0)); let mut inline_start_range = Range::new(text_fragment_info.range.begin(), ByteIndex(0));
let mut inline_end_range = None; let mut inline_end_range = None;
let mut overflowing = false; let mut overflowing = false;
@ -1651,7 +1649,7 @@ impl Fragment {
// We're going to overflow the line. // We're going to overflow the line.
overflowing = true; overflowing = true;
inline_start_range = slice.text_run_range(); inline_start_range = slice.text_run_range();
remaining_range = Range::new(slice.text_run_range().end(), CharIndex(0)); remaining_range = Range::new(slice.text_run_range().end(), ByteIndex(0));
remaining_range.extend_to(text_fragment_info.range.end()); remaining_range.extend_to(text_fragment_info.range.end());
} }
@ -2322,32 +2320,20 @@ impl Fragment {
match self.specific { match self.specific {
SpecificFragmentInfo::ScannedText(ref mut scanned_text_fragment_info) => { SpecificFragmentInfo::ScannedText(ref mut scanned_text_fragment_info) => {
let mut leading_whitespace_character_count = 0; let leading_whitespace_byte_count = scanned_text_fragment_info.text()
{ .find(|c| !util::str::char_is_whitespace(c))
let text = slice_chars( .unwrap_or(scanned_text_fragment_info.text().len());
&*scanned_text_fragment_info.run.text,
scanned_text_fragment_info.range.begin().to_usize(),
scanned_text_fragment_info.range.end().to_usize());
for character in text.chars() {
if util::str::char_is_whitespace(character) {
leading_whitespace_character_count += 1
} else {
break
}
}
}
let whitespace_len = ByteIndex(leading_whitespace_byte_count as isize);
let whitespace_range = Range::new(scanned_text_fragment_info.range.begin(), let whitespace_range = Range::new(scanned_text_fragment_info.range.begin(),
CharIndex(leading_whitespace_character_count)); whitespace_len);
let text_bounds = let text_bounds =
scanned_text_fragment_info.run.metrics_for_range(&whitespace_range).bounding_box; scanned_text_fragment_info.run.metrics_for_range(&whitespace_range).bounding_box;
self.border_box.size.inline = self.border_box.size.inline - text_bounds.size.width; self.border_box.size.inline = self.border_box.size.inline - text_bounds.size.width;
scanned_text_fragment_info.content_size.inline = scanned_text_fragment_info.content_size.inline =
scanned_text_fragment_info.content_size.inline - text_bounds.size.width; scanned_text_fragment_info.content_size.inline - text_bounds.size.width;
scanned_text_fragment_info.range.adjust_by( scanned_text_fragment_info.range.adjust_by(whitespace_len, -whitespace_len);
CharIndex(leading_whitespace_character_count),
-CharIndex(leading_whitespace_character_count));
WhitespaceStrippingResult::RetainFragment WhitespaceStrippingResult::RetainFragment
} }
@ -2388,43 +2374,29 @@ impl Fragment {
match self.specific { match self.specific {
SpecificFragmentInfo::ScannedText(ref mut scanned_text_fragment_info) => { SpecificFragmentInfo::ScannedText(ref mut scanned_text_fragment_info) => {
// FIXME(pcwalton): Is there a more clever (i.e. faster) way to do this? let mut trailing_whitespace_start_byte = 0;
debug!("stripping trailing whitespace: range={:?}, len={}", for (i, c) in scanned_text_fragment_info.text().char_indices().rev() {
scanned_text_fragment_info.range, if !util::str::char_is_whitespace(c) {
scanned_text_fragment_info.run.text.chars().count()); trailing_whitespace_start_byte = i + c.len_utf8();
let mut trailing_whitespace_character_count = 0; break;
let text_bounds;
{
let text = slice_chars(&*scanned_text_fragment_info.run.text,
scanned_text_fragment_info.range.begin().to_usize(),
scanned_text_fragment_info.range.end().to_usize());
for ch in text.chars().rev() {
if util::str::char_is_whitespace(ch) {
trailing_whitespace_character_count += 1
} else {
break
}
} }
let whitespace_range =
Range::new(scanned_text_fragment_info.range.end() -
CharIndex(trailing_whitespace_character_count),
CharIndex(trailing_whitespace_character_count));
text_bounds = scanned_text_fragment_info.run
.metrics_for_range(&whitespace_range)
.bounding_box;
self.border_box.size.inline = self.border_box.size.inline -
text_bounds.size.width;
} }
let whitespace_start = ByteIndex(trailing_whitespace_start_byte as isize);
let whitespace_len = scanned_text_fragment_info.range.length() - whitespace_start;
let whitespace_range = Range::new(whitespace_start, whitespace_len);
// FIXME: This may be unnecessary because these metrics will be recomputed in
// LineBreaker::strip_trailing_whitespace_from_pending_line_if_necessary
let text_bounds = scanned_text_fragment_info.run
.metrics_for_range(&whitespace_range)
.bounding_box;
self.border_box.size.inline = self.border_box.size.inline -
text_bounds.size.width;
scanned_text_fragment_info.content_size.inline = scanned_text_fragment_info.content_size.inline =
scanned_text_fragment_info.content_size.inline - text_bounds.size.width; scanned_text_fragment_info.content_size.inline - text_bounds.size.width;
if trailing_whitespace_character_count != 0 { scanned_text_fragment_info.range.extend_by(-whitespace_len);
scanned_text_fragment_info.range.extend_by(
CharIndex(-trailing_whitespace_character_count));
}
WhitespaceStrippingResult::RetainFragment WhitespaceStrippingResult::RetainFragment
} }
SpecificFragmentInfo::UnscannedText(ref mut unscanned_text_fragment_info) => { SpecificFragmentInfo::UnscannedText(ref mut unscanned_text_fragment_info) => {

View file

@ -12,7 +12,7 @@ use fragment::{ScannedTextFragmentInfo, SELECTED, SpecificFragmentInfo, Unscanne
use gfx::font::{DISABLE_KERNING_SHAPING_FLAG, FontMetrics, IGNORE_LIGATURES_SHAPING_FLAG}; use gfx::font::{DISABLE_KERNING_SHAPING_FLAG, FontMetrics, IGNORE_LIGATURES_SHAPING_FLAG};
use gfx::font::{RTL_FLAG, RunMetrics, ShapingFlags, ShapingOptions}; use gfx::font::{RTL_FLAG, RunMetrics, ShapingFlags, ShapingOptions};
use gfx::font_context::FontContext; use gfx::font_context::FontContext;
use gfx::text::glyph::CharIndex; use gfx::text::glyph::ByteIndex;
use gfx::text::text_run::TextRun; use gfx::text::text_run::TextRun;
use gfx::text::util::{self, CompressionMode}; use gfx::text::util::{self, CompressionMode};
use inline::{FIRST_FRAGMENT_OF_ELEMENT, InlineFragments, LAST_FRAGMENT_OF_ELEMENT}; use inline::{FIRST_FRAGMENT_OF_ELEMENT, InlineFragments, LAST_FRAGMENT_OF_ELEMENT};
@ -174,7 +174,7 @@ impl TextRunScanner {
for (fragment_index, in_fragment) in self.clump.iter().enumerate() { for (fragment_index, in_fragment) in self.clump.iter().enumerate() {
debug!(" flushing {:?}", in_fragment); debug!(" flushing {:?}", in_fragment);
let mut mapping = RunMapping::new(&run_info_list[..], &run_info, fragment_index); let mut mapping = RunMapping::new(&run_info_list[..], fragment_index);
let text; let text;
let selection; let selection;
match in_fragment.specific { match in_fragment.specific {
@ -188,13 +188,13 @@ impl TextRunScanner {
Some(range) if range.is_empty() => { Some(range) if range.is_empty() => {
// `range` is the range within the current fragment. To get the range // `range` is the range within the current fragment. To get the range
// within the text run, offset it by the length of the preceding fragments. // within the text run, offset it by the length of the preceding fragments.
Some(range.begin() + CharIndex(run_info.character_length as isize)) Some(range.begin() + ByteIndex(run_info.text.len() as isize))
} }
_ => None _ => None
}; };
let (mut start_position, mut end_position) = (0, 0); let (mut start_position, mut end_position) = (0, 0);
for (char_index, character) in text.chars().enumerate() { for (byte_index, character) in text.char_indices() {
// Search for the first font in this font group that contains a glyph for this // Search for the first font in this font group that contains a glyph for this
// character. // character.
let mut font_index = 0; let mut font_index = 0;
@ -226,7 +226,7 @@ impl TextRunScanner {
} }
let selected = match selection { let selected = match selection {
Some(range) => range.contains(CharIndex(char_index as isize)), Some(range) => range.contains(ByteIndex(byte_index as isize)),
None => false None => false
}; };
@ -251,7 +251,6 @@ impl TextRunScanner {
run_info = RunInfo::new(); run_info = RunInfo::new();
} }
mapping = RunMapping::new(&run_info_list[..], mapping = RunMapping::new(&run_info_list[..],
&run_info,
fragment_index); fragment_index);
} }
run_info.font_index = font_index; run_info.font_index = font_index;
@ -343,11 +342,14 @@ impl TextRunScanner {
let mut mapping = mappings.next().unwrap(); let mut mapping = mappings.next().unwrap();
let scanned_run = runs[mapping.text_run_index].clone(); let scanned_run = runs[mapping.text_run_index].clone();
let mut byte_range = Range::new(ByteIndex(mapping.byte_range.begin() as isize),
ByteIndex(mapping.byte_range.length() as isize));
let requires_line_break_afterward_if_wrapping_on_newlines = let requires_line_break_afterward_if_wrapping_on_newlines =
!mapping.byte_range.is_empty() && !mapping.byte_range.is_empty() &&
scanned_run.run.text.char_at_reverse(mapping.byte_range.end()) == '\n'; scanned_run.run.text.char_at_reverse(mapping.byte_range.end()) == '\n';
if requires_line_break_afterward_if_wrapping_on_newlines { if requires_line_break_afterward_if_wrapping_on_newlines {
mapping.char_range.extend_by(CharIndex(-1)); byte_range.extend_by(ByteIndex(-1)); // Trim the '\n'
} }
let text_size = old_fragment.border_box.size; let text_size = old_fragment.border_box.size;
@ -368,12 +370,12 @@ impl TextRunScanner {
let mut new_text_fragment_info = box ScannedTextFragmentInfo::new( let mut new_text_fragment_info = box ScannedTextFragmentInfo::new(
scanned_run.run, scanned_run.run,
mapping.char_range, byte_range,
text_size, text_size,
insertion_point, insertion_point,
flags); flags);
let new_metrics = new_text_fragment_info.run.metrics_for_range(&mapping.char_range); let new_metrics = new_text_fragment_info.run.metrics_for_range(&byte_range);
let writing_mode = old_fragment.style.writing_mode; let writing_mode = old_fragment.style.writing_mode;
let bounding_box_size = bounding_box_for_run_metrics(&new_metrics, writing_mode); let bounding_box_size = bounding_box_for_run_metrics(&new_metrics, writing_mode);
new_text_fragment_info.content_size = bounding_box_size; new_text_fragment_info.content_size = bounding_box_size;
@ -490,7 +492,7 @@ fn split_first_fragment_at_newline_if_necessary(fragments: &mut LinkedList<Fragm
unscanned_text_fragment_info.text[..(position + 1)].to_owned(); unscanned_text_fragment_info.text[..(position + 1)].to_owned();
unscanned_text_fragment_info.text = unscanned_text_fragment_info.text =
unscanned_text_fragment_info.text[(position + 1)..].to_owned().into_boxed_str(); unscanned_text_fragment_info.text[(position + 1)..].to_owned().into_boxed_str();
let offset = CharIndex(string_before.char_indices().count() as isize); let offset = ByteIndex(string_before.len() as isize);
match unscanned_text_fragment_info.selection { match unscanned_text_fragment_info.selection {
Some(ref mut selection) if selection.begin() >= offset => { Some(ref mut selection) if selection.begin() >= offset => {
// Selection is entirely in the second fragment. // Selection is entirely in the second fragment.
@ -500,7 +502,7 @@ fn split_first_fragment_at_newline_if_necessary(fragments: &mut LinkedList<Fragm
Some(ref mut selection) if selection.end() > offset => { Some(ref mut selection) if selection.end() > offset => {
// Selection is split across two fragments. // Selection is split across two fragments.
selection_before = Some(Range::new(selection.begin(), offset)); selection_before = Some(Range::new(selection.begin(), offset));
*selection = Range::new(CharIndex(0), selection.end() - offset); *selection = Range::new(ByteIndex(0), selection.end() - offset);
} }
_ => { _ => {
// Selection is entirely in the first fragment. // Selection is entirely in the first fragment.
@ -523,11 +525,9 @@ struct RunInfo {
/// The text that will go in this text run. /// The text that will go in this text run.
text: String, text: String,
/// The insertion point in this text run, if applicable. /// The insertion point in this text run, if applicable.
insertion_point: Option<CharIndex>, insertion_point: Option<ByteIndex>,
/// The index of the applicable font in the font group. /// The index of the applicable font in the font group.
font_index: usize, font_index: usize,
/// A cached copy of the number of Unicode characters in the text run.
character_length: usize,
/// The bidirection embedding level of this text run. /// The bidirection embedding level of this text run.
bidi_level: u8, bidi_level: u8,
/// The Unicode script property of this text run. /// The Unicode script property of this text run.
@ -540,7 +540,6 @@ impl RunInfo {
text: String::new(), text: String::new(),
insertion_point: None, insertion_point: None,
font_index: 0, font_index: 0,
character_length: 0,
bidi_level: 0, bidi_level: 0,
script: Script::Common, script: Script::Common,
} }
@ -552,9 +551,9 @@ impl RunInfo {
/// of this text run. /// of this text run.
fn flush(mut self, fn flush(mut self,
list: &mut Vec<RunInfo>, list: &mut Vec<RunInfo>,
insertion_point: &mut Option<CharIndex>) { insertion_point: &mut Option<ByteIndex>) {
if let Some(idx) = *insertion_point { if let Some(idx) = *insertion_point {
let char_len = CharIndex(self.character_length as isize); let char_len = ByteIndex(self.text.len() as isize);
if idx <= char_len { if idx <= char_len {
// The insertion point is in this text run. // The insertion point is in this text run.
self.insertion_point = insertion_point.take() self.insertion_point = insertion_point.take()
@ -571,8 +570,6 @@ impl RunInfo {
/// for it. /// for it.
#[derive(Copy, Clone, Debug)] #[derive(Copy, Clone, Debug)]
struct RunMapping { struct RunMapping {
/// The range of characters within the text fragment.
char_range: Range<CharIndex>,
/// The range of byte indices within the text fragment. /// The range of byte indices within the text fragment.
byte_range: Range<usize>, byte_range: Range<usize>,
/// The index of the unscanned text fragment that this mapping corresponds to. /// The index of the unscanned text fragment that this mapping corresponds to.
@ -585,13 +582,10 @@ struct RunMapping {
impl RunMapping { impl RunMapping {
/// Given the current set of text runs, creates a run mapping for the next fragment. /// Given the current set of text runs, creates a run mapping for the next fragment.
/// `run_info_list` describes the set of runs we've seen already, and `current_run_info` /// `run_info_list` describes the set of runs we've seen already.
/// describes the run we just finished processing. fn new(run_info_list: &[RunInfo], fragment_index: usize)
fn new(run_info_list: &[RunInfo], current_run_info: &RunInfo, fragment_index: usize)
-> RunMapping { -> RunMapping {
RunMapping { RunMapping {
char_range: Range::new(CharIndex(current_run_info.character_length as isize),
CharIndex(0)),
byte_range: Range::new(0, 0), byte_range: Range::new(0, 0),
old_fragment_index: fragment_index, old_fragment_index: fragment_index,
text_run_index: run_info_list.len(), text_run_index: run_info_list.len(),
@ -620,26 +614,21 @@ impl RunMapping {
// Account for `text-transform`. (Confusingly, this is not handled in "text // Account for `text-transform`. (Confusingly, this is not handled in "text
// transformation" above, but we follow Gecko in the naming.) // transformation" above, but we follow Gecko in the naming.)
let is_first_run = *start_position == 0; let is_first_run = *start_position == 0;
let character_count = apply_style_transform_if_necessary(&mut run_info.text, apply_style_transform_if_necessary(&mut run_info.text, old_byte_length, text_transform,
old_byte_length, *last_whitespace, is_first_run);
text_transform,
*last_whitespace,
is_first_run);
run_info.character_length = run_info.character_length + character_count;
*start_position = end_position; *start_position = end_position;
let new_byte_length = run_info.text.len();
let is_empty = new_byte_length == old_byte_length;
// Don't save mappings that contain only discarded characters. // Don't save mappings that contain only discarded characters.
// (But keep ones that contained no characters to begin with, since they might have been // (But keep ones that contained no characters to begin with, since they might have been
// generated by an empty flow to draw its borders/padding/insertion point.) // generated by an empty flow to draw its borders/padding/insertion point.)
let is_empty = character_count == 0;
if is_empty && !was_empty { if is_empty && !was_empty {
return; return;
} }
let new_byte_length = run_info.text.len();
self.byte_range = Range::new(old_byte_length, new_byte_length - old_byte_length); self.byte_range = Range::new(old_byte_length, new_byte_length - old_byte_length);
self.char_range.extend_by(CharIndex(character_count as isize));
mappings.push(self) mappings.push(self)
} }
@ -648,10 +637,10 @@ impl RunMapping {
/// NOTE: We treat the range as inclusive at both ends, since the insertion point can lie /// NOTE: We treat the range as inclusive at both ends, since the insertion point can lie
/// before the first character *or* after the last character, and should be drawn even if the /// before the first character *or* after the last character, and should be drawn even if the
/// text is empty. /// text is empty.
fn contains_insertion_point(&self, insertion_point: Option<CharIndex>) -> bool { fn contains_insertion_point(&self, insertion_point: Option<ByteIndex>) -> bool {
match insertion_point { match insertion_point.map(ByteIndex::to_usize) {
None => false, None => false,
Some(idx) => self.char_range.begin() <= idx && idx <= self.char_range.end() Some(idx) => self.byte_range.begin() <= idx && idx <= self.byte_range.end()
} }
} }
} }
@ -666,39 +655,29 @@ fn apply_style_transform_if_necessary(string: &mut String,
first_character_position: usize, first_character_position: usize,
text_transform: text_transform::T, text_transform: text_transform::T,
last_whitespace: bool, last_whitespace: bool,
is_first_run: bool) is_first_run: bool) {
-> usize {
match text_transform { match text_transform {
text_transform::T::none => string[first_character_position..].chars().count(), text_transform::T::none => {}
text_transform::T::uppercase => { text_transform::T::uppercase => {
let original = string[first_character_position..].to_owned(); let original = string[first_character_position..].to_owned();
string.truncate(first_character_position); string.truncate(first_character_position);
let mut count = 0;
for ch in original.chars().flat_map(|ch| ch.to_uppercase()) { for ch in original.chars().flat_map(|ch| ch.to_uppercase()) {
string.push(ch); string.push(ch);
count += 1;
} }
count
} }
text_transform::T::lowercase => { text_transform::T::lowercase => {
let original = string[first_character_position..].to_owned(); let original = string[first_character_position..].to_owned();
string.truncate(first_character_position); string.truncate(first_character_position);
let mut count = 0;
for ch in original.chars().flat_map(|ch| ch.to_lowercase()) { for ch in original.chars().flat_map(|ch| ch.to_lowercase()) {
string.push(ch); string.push(ch);
count += 1;
} }
count
} }
text_transform::T::capitalize => { text_transform::T::capitalize => {
let original = string[first_character_position..].to_owned(); let original = string[first_character_position..].to_owned();
string.truncate(first_character_position); string.truncate(first_character_position);
let mut capitalize_next_letter = is_first_run || last_whitespace; let mut capitalize_next_letter = is_first_run || last_whitespace;
let mut count = 0;
for character in original.chars() { for character in original.chars() {
count += 1;
// FIXME(#4311, pcwalton): Should be the CSS/Unicode notion of a *typographic // FIXME(#4311, pcwalton): Should be the CSS/Unicode notion of a *typographic
// letter unit*, not an *alphabetic* character: // letter unit*, not an *alphabetic* character:
// //
@ -716,8 +695,6 @@ fn apply_style_transform_if_necessary(string: &mut String,
capitalize_next_letter = true capitalize_next_letter = true
} }
} }
count
} }
} }
} }
@ -725,7 +702,7 @@ fn apply_style_transform_if_necessary(string: &mut String,
#[derive(Clone)] #[derive(Clone)]
struct ScannedTextRun { struct ScannedTextRun {
run: Arc<TextRun>, run: Arc<TextRun>,
insertion_point: Option<CharIndex>, insertion_point: Option<ByteIndex>,
} }
/// Can a character with script `b` continue a text run with script `a`? /// Can a character with script `b` continue a text run with script `a`?

View file

@ -392,7 +392,7 @@ impl WebRenderDisplayItemConverter for DisplayItem {
let mut glyphs = vec!(); let mut glyphs = vec!();
for slice in item.text_run.natural_word_slices_in_visual_order(&item.range) { for slice in item.text_run.natural_word_slices_in_visual_order(&item.range) {
for glyph in slice.glyphs.iter_glyphs_for_char_range(&slice.range) { for glyph in slice.glyphs.iter_glyphs_for_byte_range(&slice.range) {
let glyph_advance = glyph.advance(); let glyph_advance = glyph.advance();
let glyph_offset = glyph.offset().unwrap_or(Point2D::zero()); let glyph_offset = glyph.offset().unwrap_or(Point2D::zero());
let glyph = webrender_traits::GlyphInstance { let glyph = webrender_traits::GlyphInstance {

View file

@ -33,7 +33,7 @@
use core::nonzero::NonZero; use core::nonzero::NonZero;
use data::{LayoutDataFlags, PrivateLayoutData}; use data::{LayoutDataFlags, PrivateLayoutData};
use gfx::display_list::OpaqueNode; use gfx::display_list::OpaqueNode;
use gfx::text::glyph::CharIndex; use gfx::text::glyph::ByteIndex;
use gfx_traits::{LayerId, LayerType}; use gfx_traits::{LayerId, LayerType};
use incremental::RestyleDamage; use incremental::RestyleDamage;
use msg::constellation_msg::PipelineId; use msg::constellation_msg::PipelineId;
@ -74,7 +74,7 @@ use style::restyle_hints::ElementSnapshot;
use style::selector_impl::{NonTSPseudoClass, PseudoElement, ServoSelectorImpl}; use style::selector_impl::{NonTSPseudoClass, PseudoElement, ServoSelectorImpl};
use style::servo::PrivateStyleData; use style::servo::PrivateStyleData;
use url::Url; use url::Url;
use util::str::{is_whitespace, search_index}; use util::str::is_whitespace;
pub type NonOpaqueStyleAndLayoutData = *mut RefCell<PrivateLayoutData>; pub type NonOpaqueStyleAndLayoutData = *mut RefCell<PrivateLayoutData>;
@ -838,7 +838,7 @@ pub trait ThreadSafeLayoutNode : Clone + Copy + Sized + PartialEq {
fn text_content(&self) -> TextContent; fn text_content(&self) -> TextContent;
/// If the insertion point is within this node, returns it. Otherwise, returns `None`. /// If the insertion point is within this node, returns it. Otherwise, returns `None`.
fn selection(&self) -> Option<Range<CharIndex>>; fn selection(&self) -> Option<Range<ByteIndex>>;
/// If this is an image element, returns its URL. If this is not an image element, fails. /// If this is an image element, returns its URL. If this is not an image element, fails.
/// ///
@ -1077,27 +1077,18 @@ impl<'ln> ThreadSafeLayoutNode for ServoThreadSafeLayoutNode<'ln> {
panic!("not text!") panic!("not text!")
} }
fn selection(&self) -> Option<Range<CharIndex>> { fn selection(&self) -> Option<Range<ByteIndex>> {
let this = unsafe { let this = unsafe { self.get_jsmanaged() };
self.get_jsmanaged()
};
if let Some(area) = this.downcast::<HTMLTextAreaElement>() { let selection = if let Some(area) = this.downcast::<HTMLTextAreaElement>() {
if let Some(selection) = unsafe { area.get_absolute_selection_for_layout() } { unsafe { area.selection_for_layout() }
let text = unsafe { area.get_value_for_layout() }; } else if let Some(input) = this.downcast::<HTMLInputElement>() {
let begin_byte = selection.begin(); unsafe { input.selection_for_layout() }
let begin = search_index(begin_byte, text.char_indices()); } else {
let length = search_index(selection.length(), text[begin_byte..].char_indices()); return None;
return Some(Range::new(CharIndex(begin), CharIndex(length))); };
} selection.map(|range| Range::new(ByteIndex(range.begin() as isize),
} ByteIndex(range.length() as isize)))
if let Some(input) = this.downcast::<HTMLInputElement>() {
if let Some(selection) = unsafe { input.selection_for_layout() } {
return Some(Range::new(CharIndex(selection.begin()),
CharIndex(selection.length())));
}
}
None
} }
fn image_url(&self) -> Option<Url> { fn image_url(&self) -> Option<Url> {

View file

@ -43,10 +43,11 @@ use style::element_state::*;
use textinput::KeyReaction::{DispatchInput, Nothing, RedrawSelection, TriggerDefaultAction}; use textinput::KeyReaction::{DispatchInput, Nothing, RedrawSelection, TriggerDefaultAction};
use textinput::Lines::Single; use textinput::Lines::Single;
use textinput::{TextInput, SelectionDirection}; use textinput::{TextInput, SelectionDirection};
use util::str::{DOMString, search_index}; use util::str::{DOMString};
const DEFAULT_SUBMIT_VALUE: &'static str = "Submit"; const DEFAULT_SUBMIT_VALUE: &'static str = "Submit";
const DEFAULT_RESET_VALUE: &'static str = "Reset"; const DEFAULT_RESET_VALUE: &'static str = "Reset";
const PASSWORD_REPLACEMENT_CHAR: char = '●';
#[derive(JSTraceable, PartialEq, Copy, Clone)] #[derive(JSTraceable, PartialEq, Copy, Clone)]
#[allow(dead_code)] #[allow(dead_code)]
@ -174,7 +175,7 @@ pub trait LayoutHTMLInputElementHelpers {
#[allow(unsafe_code)] #[allow(unsafe_code)]
unsafe fn size_for_layout(self) -> u32; unsafe fn size_for_layout(self) -> u32;
#[allow(unsafe_code)] #[allow(unsafe_code)]
unsafe fn selection_for_layout(self) -> Option<Range<isize>>; unsafe fn selection_for_layout(self) -> Option<Range<usize>>;
#[allow(unsafe_code)] #[allow(unsafe_code)]
unsafe fn checked_state_for_layout(self) -> bool; unsafe fn checked_state_for_layout(self) -> bool;
#[allow(unsafe_code)] #[allow(unsafe_code)]
@ -207,8 +208,7 @@ impl LayoutHTMLInputElementHelpers for LayoutJS<HTMLInputElement> {
InputType::InputPassword => { InputType::InputPassword => {
let text = get_raw_textinput_value(self); let text = get_raw_textinput_value(self);
if !text.is_empty() { if !text.is_empty() {
// The implementation of selection_for_layout expects a 1:1 mapping of chars. text.chars().map(|_| PASSWORD_REPLACEMENT_CHAR).collect()
text.chars().map(|_| '●').collect()
} else { } else {
String::from((*self.unsafe_get()).placeholder.borrow_for_layout().clone()) String::from((*self.unsafe_get()).placeholder.borrow_for_layout().clone())
} }
@ -216,7 +216,6 @@ impl LayoutHTMLInputElementHelpers for LayoutJS<HTMLInputElement> {
_ => { _ => {
let text = get_raw_textinput_value(self); let text = get_raw_textinput_value(self);
if !text.is_empty() { if !text.is_empty() {
// The implementation of selection_for_layout expects a 1:1 mapping of chars.
String::from(text) String::from(text)
} else { } else {
String::from((*self.unsafe_get()).placeholder.borrow_for_layout().clone()) String::from((*self.unsafe_get()).placeholder.borrow_for_layout().clone())
@ -233,24 +232,29 @@ impl LayoutHTMLInputElementHelpers for LayoutJS<HTMLInputElement> {
#[allow(unrooted_must_root)] #[allow(unrooted_must_root)]
#[allow(unsafe_code)] #[allow(unsafe_code)]
unsafe fn selection_for_layout(self) -> Option<Range<isize>> { unsafe fn selection_for_layout(self) -> Option<Range<usize>> {
if !(*self.unsafe_get()).upcast::<Element>().focus_state() { if !(*self.unsafe_get()).upcast::<Element>().focus_state() {
return None; return None;
} }
// Use the raw textinput to get the index as long as we use a 1:1 char mapping
// in value_for_layout.
let raw = match (*self.unsafe_get()).input_type.get() {
InputType::InputText |
InputType::InputPassword => get_raw_textinput_value(self),
_ => return None
};
let textinput = (*self.unsafe_get()).textinput.borrow_for_layout(); let textinput = (*self.unsafe_get()).textinput.borrow_for_layout();
let selection = textinput.get_absolute_selection_range();
let begin_byte = selection.begin(); match (*self.unsafe_get()).input_type.get() {
let begin = search_index(begin_byte, raw.char_indices()); InputType::InputPassword => {
let length = search_index(selection.length(), raw[begin_byte..].char_indices()); let text = get_raw_textinput_value(self);
Some(Range::new(begin, length)) let sel = textinput.get_absolute_selection_range();
// Translate indices from the raw value to indices in the replacement value.
let char_start = text[.. sel.begin()].chars().count();
let char_count = text[sel.begin() .. sel.end()].chars().count();
let bytes_per_char = PASSWORD_REPLACEMENT_CHAR.len_utf8();
Some(Range::new(char_start * bytes_per_char,
char_count * bytes_per_char))
}
InputType::InputText => Some(textinput.get_absolute_selection_range()),
_ => None
}
} }
#[allow(unrooted_must_root)] #[allow(unrooted_must_root)]

View file

@ -47,7 +47,7 @@ pub trait LayoutHTMLTextAreaElementHelpers {
#[allow(unsafe_code)] #[allow(unsafe_code)]
unsafe fn get_value_for_layout(self) -> String; unsafe fn get_value_for_layout(self) -> String;
#[allow(unsafe_code)] #[allow(unsafe_code)]
unsafe fn get_absolute_selection_for_layout(self) -> Option<Range<usize>>; unsafe fn selection_for_layout(self) -> Option<Range<usize>>;
#[allow(unsafe_code)] #[allow(unsafe_code)]
fn get_cols(self) -> u32; fn get_cols(self) -> u32;
#[allow(unsafe_code)] #[allow(unsafe_code)]
@ -63,13 +63,12 @@ impl LayoutHTMLTextAreaElementHelpers for LayoutJS<HTMLTextAreaElement> {
#[allow(unrooted_must_root)] #[allow(unrooted_must_root)]
#[allow(unsafe_code)] #[allow(unsafe_code)]
unsafe fn get_absolute_selection_for_layout(self) -> Option<Range<usize>> { unsafe fn selection_for_layout(self) -> Option<Range<usize>> {
if (*self.unsafe_get()).upcast::<Element>().focus_state() { if !(*self.unsafe_get()).upcast::<Element>().focus_state() {
Some((*self.unsafe_get()).textinput.borrow_for_layout() return None;
.get_absolute_selection_range())
} else {
None
} }
let textinput = (*self.unsafe_get()).textinput.borrow_for_layout();
Some(textinput.get_absolute_selection_range())
} }
#[allow(unsafe_code)] #[allow(unsafe_code)]

View file

@ -11,7 +11,7 @@ use std::ffi::CStr;
use std::fmt; use std::fmt;
use std::iter::{Filter, Peekable}; use std::iter::{Filter, Peekable};
use std::ops::{Deref, DerefMut}; use std::ops::{Deref, DerefMut};
use std::str::{Bytes, CharIndices, Split, from_utf8}; use std::str::{Bytes, Split, from_utf8};
use string_cache::Atom; use string_cache::Atom;
#[derive(Clone, Debug, Deserialize, Eq, Hash, HeapSizeOf, Ord, PartialEq, PartialOrd, Serialize)] #[derive(Clone, Debug, Deserialize, Eq, Hash, HeapSizeOf, Ord, PartialEq, PartialOrd, Serialize)]
@ -271,40 +271,3 @@ pub fn str_join<I, T>(strs: I, join: &str) -> String
acc acc
}) })
} }
// Lifted from Rust's StrExt implementation, which is being removed.
pub fn slice_chars(s: &str, begin: usize, end: usize) -> &str {
assert!(begin <= end);
let mut count = 0;
let mut begin_byte = None;
let mut end_byte = None;
// This could be even more efficient by not decoding,
// only finding the char boundaries
for (idx, _) in s.char_indices() {
if count == begin { begin_byte = Some(idx); }
if count == end { end_byte = Some(idx); break; }
count += 1;
}
if begin_byte.is_none() && count == begin { begin_byte = Some(s.len()) }
if end_byte.is_none() && count == end { end_byte = Some(s.len()) }
match (begin_byte, end_byte) {
(None, _) => panic!("slice_chars: `begin` is beyond end of string"),
(_, None) => panic!("slice_chars: `end` is beyond end of string"),
(Some(a), Some(b)) => unsafe { s.slice_unchecked(a, b) }
}
}
// searches a character index in CharIndices
// returns indices.count if not found
pub fn search_index(index: usize, indices: CharIndices) -> isize {
let mut character_count = 0;
for (character_index, _) in indices {
if character_index == index {
return character_count;
}
character_count += 1
}
character_count
}

View file

@ -2,7 +2,7 @@
* License, v. 2.0. If a copy of the MPL was not distributed with this * License, v. 2.0. If a copy of the MPL was not distributed with this
* file, You can obtain one at http://mozilla.org/MPL/2.0/. */ * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
use util::str::{search_index, split_html_space_chars, str_join}; use util::str::{split_html_space_chars, str_join};
#[test] #[test]
pub fn split_html_space_chars_whitespace() { pub fn split_html_space_chars_whitespace() {
@ -33,15 +33,3 @@ pub fn test_str_join_many() {
let expected = "-alpha--beta-gamma-"; let expected = "-alpha--beta-gamma-";
assert_eq!(actual, expected); assert_eq!(actual, expected);
} }
#[test]
pub fn test_search_index() {
let tuples = [("", 1, 0),
("foo", 8, 3),
("føo", 8, 3),
("foo", 2, 2),
("føo", 2, 3)];
for t in tuples.iter() {
assert_eq!(search_index(t.1, t.0.char_indices()), t.2);
};
}